{"created":"2025-01-18T22:51:40.670889+00:00","updated":"2025-01-22T22:22:53.044092+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00019128","sets":["1164:1165:1179:1182"]},"path":["1182"],"owner":"1","recid":"19128","title":["テキスト構文構造類似度を用いた類似文検索手法"],"pubdate":{"attribute_name":"公開日","attribute_value":"2005-05-19"},"_buckets":{"deposit":"7403d740-cb76-49fa-a6c9-92edb04b34c5"},"_deposit":{"id":"19128","pid":{"type":"depid","value":"19128","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"テキスト構文構造類似度を用いた類似文検索手法","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"テキスト構文構造類似度を用いた類似文検索手法"},{"subitem_title":"New methods to retrieve sentences based on syntactic similarity","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2005-05-19","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京工業大学 大学院情報理工学研究科 計算工学専攻"},{"subitem_text_value":"東京工業大学 大学院情報理工学研究科 計算工学専攻"},{"subitem_text_value":"東京工業大学 大学院情報理工学研究科 計算工学専攻"},{"subitem_text_value":"中京大学 情報科学部 認知科学科"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Department of Computer Science Graduate School of Information Science and Engineering Tokyo Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science Graduate School of Information Science and Engineering Tokyo Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science Graduate School of Information Science and Engineering Tokyo Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Cognitive Science Major Graduate School of Computer and Cognitive Sciences Chukyo University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/19128/files/IPSJ-DBS05136006.pdf"},"date":[{"dateType":"Available","dateValue":"2007-05-19"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-DBS05136006.pdf","filesize":[{"value":"303.0 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"5b1ba1e9-f6d4-4ba1-aa49-8c6ff1dbece9","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2005 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"市川, 宙"},{"creatorName":"橋本, 泰一"},{"creatorName":"徳永, 健伸"},{"creatorName":"田中, 穂積"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Hiroshi, Ichikawa","creatorNameLang":"en"},{"creatorName":"Taiichi, Hashimoto","creatorNameLang":"en"},{"creatorName":"Takenobu, Tokunaga","creatorNameLang":"en"},{"creatorName":"Hozumi, Tanaka","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10112482","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本論文では,構文木付きコーパスから,構文的に類似した文を検索する手法を提案した.構文的類似度の計算手法としてはTree Kernel (Collins)が提案されている.しかし,Tree Kernelの類似度計算は時間を要するため,これを類似文検索に応用すると,検索速度が問題になる.検索時間短縮のためには,予め検索対象のインデックスを作成しておくのが一般的だが,Tree Kernelではその性質上,検索対象のインデックス化が困難である.そこで,Tree Kernelを近似する高速な新しいアルゴリズムとしてTree OverlappingとSubpath Setを提案した.これらのアルゴリズムは,Tree Kernelとは異なり,検索対象のインデックス化が可能なため,高速な検索が可能である.本論文ではTree Kernel  Tree Overlapping  Subpath Setの3種類のアルゴリズムについて述べ,実験結果を示し,比較した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper proposes a method to retrieve sentences which have a similar syntactic structure to the syntax tree of the query sentence. Tree Kernel has been proposed by Collins as a method to calculate structural similarity. However, the similarity retrieval by Tree Kernel is not practicable because Tree Kernel computation requires significant resources. A general method to shorten the retrieving time and to reduce required computation is indexing the corpora beforehand. However, in case of Tree Kernel, it is too hard to index the corpora. Therefore, we propose faster approximation algorithms: Tree Overlapping and Subpath Set. These algorithms are faster than Tree Kernel because indexing is possible. This paper describes three algorithms: Tree Kernel, Tree Overlapping and Subpath Set, and shows the result of evaluations and algorithm comparison.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"46","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告データベースシステム(DBS)"}],"bibliographicPageStart":"39","bibliographicIssueDates":{"bibliographicIssueDate":"2005-05-19","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"42(2005-DBS-136)","bibliographicVolumeNumber":"2005"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"id":19128,"links":{}}