{"created":"2025-01-18T22:50:30.210690+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00017525","sets":["934:1022:1039:1043"]},"path":["1043"],"owner":"1","recid":"17525","title":["文書情報統合のためのテキスト表現モデルの提案と主題グラフを用いた実現"],"pubdate":{"attribute_name":"公開日","attribute_value":"2005-03-15"},"_buckets":{"deposit":"b1de051a-52b7-488a-a0a8-43c3ee15a92e"},"_deposit":{"id":"17525","pid":{"type":"depid","value":"17525","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"文書情報統合のためのテキスト表現モデルの提案と主題グラフを用いた実現","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"文書情報統合のためのテキスト表現モデルの提案と主題グラフを用いた実現"},{"subitem_title":"Text Representation Model for Integrating Document Contents and Its Implementation Using Subject Graphs","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"研究論文","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2005-03-15","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"日本電信電話株式会社NTT サイバーソリューション研究所"},{"subitem_text_value":"日本電信電話株式会社NTT サイバーソリューション研究所"},{"subitem_text_value":"日本電信電話株式会社NTT サイバーソリューション研究所"},{"subitem_text_value":"日本電信電話株式会社NTT サイバーソリューション研究所"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"NTT Cyber Solutions Laboratories NTT Corporation","subitem_text_language":"en"},{"subitem_text_value":"NTT Cyber Solutions Laboratories NTT Corporation","subitem_text_language":"en"},{"subitem_text_value":"NTT Cyber Solutions Laboratories NTT Corporation","subitem_text_language":"en"},{"subitem_text_value":"NTT Cyber Solutions Laboratories NTT 
Corporation","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/17525/files/IPSJ-TOD4605007.pdf"},"date":[{"dateType":"Available","dateValue":"2007-03-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TOD4605007.pdf","filesize":[{"value":"328.3 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"b53bf7ca-47a0-4dc7-8655-6dfa573cf39e","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2005 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"富田, 準二"},{"creatorName":"石井, 恵"},{"creatorName":"中渡瀬, 秀一"},{"creatorName":"片岡, 良治"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Junji, Tomita","creatorNameLang":"en"},{"creatorName":"Megumi, Ishii","creatorNameLang":"en"},{"creatorName":"Hidekazu, Nakawatase","creatorNameLang":"en"},{"creatorName":"Ryoji, 
Kataoka","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11464847","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7799","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"複数の文書の内容を統合することによって,単一の文書からは得られないような重要な情報を取得することができる.このような文書情報の統合を行うためには,検索,分類等の様々なテキスト操作を柔軟に組み合わせて実行する必要がある.本稿では,リレーショナルデータモデルとのアナロジを用いたテキスト表現モデルを提案する.テキスト表現モデルは,文書を形式的な表現(テキスト表現)で表し,これらテキスト表現のリストに対する演算からなるテキスト操作の体系(テキスト表現代数)を提供する.テキスト表現に,単語の重要度をノードの重み,単語間の関連度をリンクの重みとした主題グラフを採用し,主題グラフに基づくテキスト用のデータベースおよび文書情報統合アプリケーションを構築する.その動作例を用いて,主題グラフに対する演算の組合せによって,有用な情報が得られることを示すとともに,テキスト表現モデルのカバー範囲を明らかにする.さらに,主題グラフが,一般に広く利用されているタームベクトルよりもテキスト表現として適していることを,演算のタスク適用性および分析結果の可読性の観点から示す.また,計算量に関する考察から主題グラフが大規模文書集合にも適用可能であることを示す.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Integrating the contents of several documents reveals important facts, that can not be acquired from a single document. The integration requires heterogeneous combinations of text handling operations such as text search and clustering. Drawing an analogy with the relational data model, we propose a text representation model that represents documents in a formal manner, i.e. text representation, and that provides a text representation algebra that consists of procedures for handling the lists of the representations. We use subject graphs as the representation; node weight is used to represent the significance of each term, and link weight is used to represent that of each term-term association. 
This paper introduces a graph-based text database based on the model and an application for integrating document contents. Examples show that the proposed technique can discover important facts. Furthermore, evaluations show that subject graphs are more suitable for representation than term vectors with regard to the applicability of procedures and readability. We also show the limitations of the model and that the computational complexity of subject graphs is reasonable.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"83","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌データベース(TOD)"}],"bibliographicPageStart":"70","bibliographicIssueDates":{"bibliographicIssueDate":"2005-03-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"SIG5(TOD25)","bibliographicVolumeNumber":"46"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"links":{},"id":17525,"updated":"2025-01-22T23:17:08.785081+00:00"}