{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00095325","sets":["934:1022:7036:7274"]},"path":["7274"],"owner":"11","recid":"95325","title":["文書の更新を考慮した高精度XML部分文書検索手法の提案"],"pubdate":{"attribute_name":"公開日","attribute_value":"2013-09-27"},"_buckets":{"deposit":"35614bef-aa84-49f3-b3d9-960a841d272b"},"_deposit":{"id":"95325","pid":{"type":"depid","value":"95325","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"文書の更新を考慮した高精度XML部分文書検索手法の提案","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"文書の更新を考慮した高精度XML部分文書検索手法の提案"},{"subitem_title":"A Proposal of Accurate XML Element Retrieval Considering Document Updates","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[研究論文] XML部分文書検索,文書索引,差分更新,大域的重み,性能評価","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2013-09-27","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"奈良先端科学技術大学院大学情報科学研究科/日本学術振興会"},{"subitem_text_value":"奈良先端科学技術大学院大学情報科学研究科"},{"subitem_text_value":"同志社大学文化情報学部"},{"subitem_text_value":"奈良先端科学技術大学院大学情報科学研究科"},{"subitem_text_value":"奈良先端科学技術大学院大学情報科学研究科"},{"subitem_text_value":"奈良先端科学技術大学院大学情報科学研究科"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Information Science, Nara Institute of Science and Technology / Japan Society for the Promotion of Science","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science, Nara Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Culture and Information Science, Doshisha University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science, Nara Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science, Nara Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science, Nara Institute of Science and Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/95325/files/IPSJ-TOD0604002.pdf"},"date":[{"dateType":"Available","dateValue":"2015-09-27"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TOD0604002.pdf","filesize":[{"value":"1.2 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"c6a130f4-d81f-4e8a-8128-7fb278cfa070","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2013 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"欅, 惇志"},{"creatorName":"宮崎, 純"},{"creatorName":"波多野, 賢治"},{"creatorName":"山本, 豪志朗"},{"creatorName":"武富, 貴史"},{"creatorName":"加藤, 博一"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Atsushi, Keyaki","creatorNameLang":"en"},{"creatorName":"Jun, Miyazaki","creatorNameLang":"en"},{"creatorName":"Kenji, Hatano","creatorNameLang":"en"},{"creatorName":"Goshiro, Yamamoto","creatorNameLang":"en"},{"creatorName":"Takafumi, Taketomi","creatorNameLang":"en"},{"creatorName":"Hirokazu, Kato","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11464847","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7799","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本論文では,文書の更新を考慮した高精度XML部分文書検索の実現を目指す.検索システムにおいて,文書の更新に対応しなかった場合,適切な検索結果を提示できず検索システムの利便性が低下するが,文書の更新発生時に検索索引を一から再構築した場合には索引構築時間が長時間に及ぶため,本論文では索引の差分更新を行う.しかし,索引の差分更新時に,システムに蓄積された文書数が十分ではない時点や,文書の更新にともなって語の統計量が変化した場合,文書集合全体から算出される統計量である大域的重みを正確に推定できない可能性がある.これらの問題を解決するため,既存のXML部分文書検索システムに索引の差分更新機能を付与し,さらに,高速な差分更新を行うために文書中の重要な箇所と索引語のみを索引へ追加するためのフィルタと,正確な大域的重み推定のためのpath式統合手法を用いた索引語の重み付け手法を提案する.評価実験の結果,統計量が変動しない文書集合に対して,提案手法は単純な差分更新と比較し,検索精度を4%向上させつつ,索引の更新速度を25%高速化した.また,統計量が変動した場合にも,速やかにその変化に追従して検索精度を向上させることが可能であることが判明した.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In this paper, we propose a method for accurately retrieving XML elements considering document updates. If document updates are not handled in a search system, users cannot obtain appropriate search results, which reduces the usefulness of the search system. We apply an incremental approach to update an index because a rebuild-from-scratch approach takes longer time. In addition, global weights, i.e., the statistics computed with all documents in the search system, may not be accurate when a few number of documents is indexed or when global weights change drastically. To solve these problems, we propose to extend a function of incremental updates of indices to general XML element retrieval systems, with filters to reduce the update cost by eliminating unimportant elements and terms. Moreover, we apply a method for integrating path expression which estimates accurate global weights in term calculation. Experimental results showed that our proposed method can be up to 25% faster to update indices than the simple incremental updates and can improve the search accuracy by 4% with document set of static statistics. The proposed method can also search accurately, even under continuous changes in the statistics of the documents.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"16","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌データベース(TOD)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2013-09-27","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4","bibliographicVolumeNumber":"6"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"id":95325,"updated":"2025-01-21T13:56:03.400845+00:00","links":{},"created":"2025-01-18T23:42:26.706714+00:00"}