{"id":17391,"updated":"2025-01-22T23:21:45.089521+00:00","links":{},"created":"2025-01-18T22:50:24.325347+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00017391","sets":["934:1022:1023:1026"]},"path":["1026"],"owner":"1","recid":"17391","title":["ブートストラップ式同位語辞書構築における検索効率の向上"],"pubdate":{"attribute_name":"公開日","attribute_value":"2008-06-26"},"_buckets":{"deposit":"480d2602-bef8-4668-8244-00edca1aeb4b"},"_deposit":{"id":"17391","pid":{"type":"depid","value":"17391","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"ブートストラップ式同位語辞書構築における検索効率の向上","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"ブートストラップ式同位語辞書構築における検索効率の向上"},{"subitem_title":"Cost-effective Search Strategy for Bootstrapping Lexicon Acquisition","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"研究論文","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2008-06-26","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"NEC C&Cイノベーション研究所"},{"subitem_text_value":"NEC共通基盤ソフトウェア研究所"},{"subitem_text_value":"NEC共通基盤ソフトウェア研究所"},{"subitem_text_value":"NEC C&Cイノベーション研究所"},{"subitem_text_value":"NEC C&Cイノベーション研究所"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"NEC C&C Innovation Research Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NEC Common Platform Software Research Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NEC Common Platform Software Research Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NEC C&C Innovation Research Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NEC C&C Innovation Research 
Laboratories","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/17391/files/IPSJ-TOD0101005.pdf"},"date":[{"dateType":"Available","dateValue":"2010-06-26"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TOD0101005.pdf","filesize":[{"value":"552.6 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"d6251b95-687c-4cb5-8708-e2a5cbb57092","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2008 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"河合, 英紀"},{"creatorName":"水口, 弘紀"},{"creatorName":"土田, 正明"},{"creatorName":"國枝, 和雄"},{"creatorName":"山田, 敬嗣"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Hideki, Kawai","creatorNameLang":"en"},{"creatorName":"Hironori, Mizuguchi","creatorNameLang":"en"},{"creatorName":"Masaaki, Tsuchida","creatorNameLang":"en"},{"creatorName":"Kazuo, Kunieda","creatorNameLang":"en"},{"creatorName":"Keiji, 
Yamada","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11464847","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7799","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,同一の意味的階層に属する単語集合(同位語辞書)を高い検索効率でWebから抽出する方法を提案する.近年,Web 上に散在した知識を収集するアプローチの1 つとしてブートストラップ式同位語辞書構築手法が注目を集めている.サーチエンジンが提供する検索API は知識収集の強力なツールである.しかし,検索API を通じて大量の検索を行うことは,サーチエンジンに過剰な負荷をかけてしまうことになる.そのため,サーチエンジン側でも検索API を通じた検索回数を制限している.そこで本稿では,検索回数をコストとして考慮し,なるべく少ない検索回数でより多くの同位語を収集可能な検索戦略を求めることを目標とする.実験の結果,合計2 000回の検索で10 万語以上のキーワードを適合率0.9 以上で抽出することができた.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In this paper, we propose a cost-effective search strategy framework to extract keywords in the same semantic class from the Web. Constructing a dictionary based on the bootstrapping technique is one of the promising approaches to harnessing knowledge scattered around the Web. Open web application programming interfaces (APIs) are powerful tools for the knowledge-gathering process. However, we have to consider the cost of API calls because too many queries can overload the search engines, and they also limited the number of API calls. Our goal is to optimize a search strategy that can collect as many new words as possible with the least API calls. 
Our results show that the optimized search strategy can extract more than 100,000 words with a precision of 0.90 using only 2,000 search API calls.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"48","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌データベース(TOD)"}],"bibliographicPageStart":"36","bibliographicIssueDates":{"bibliographicIssueDate":"2008-06-26","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicVolumeNumber":"1"}]},"relation_version_is_last":true,"weko_creator_id":"1"}}