{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00062572","sets":["1164:3500:5611:5728"]},"path":["5728"],"owner":"10","recid":"62572","title":["Web上の人名検索結果の同姓同名問題における二段階クラスタリングを用いた再現率向上"],"pubdate":{"attribute_name":"公開日","attribute_value":"2009-07-21"},"_buckets":{"deposit":"baebd051-eb4f-4135-9b4d-a846d0a74f23"},"_deposit":{"id":"62572","pid":{"type":"depid","value":"62572","revision_id":0},"owners":[10],"status":"published","created_by":10},"item_title":"Web上の人名検索結果の同姓同名問題における二段階クラスタリングを用いた再現率向上","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Web上の人名検索結果の同姓同名問題における二段階クラスタリングを用いた再現率向上"},{"subitem_title":"Improvement Recall of Person Name Disambiguation on the Web People Search by TwoStage Clustering","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"クラスタリング","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2009-07-21","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京大学大学院情報理工学系研究科"},{"subitem_text_value":"東京大学大学院情報理工学系研究科"},{"subitem_text_value":"東京大学大学院情報理工学系研究科"},{"subitem_text_value":"東京大学情報基盤センター"},{"subitem_text_value":"東京大学情報基盤センター"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Information Science and Technology, The University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science and Technology, The University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Information Science and Technology, The University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"Information Technology Center, The University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"Information Technology Center, The University of 
Tokyo","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/62572/files/IPSJ-FI09095006.pdf"},"date":[{"dateType":"Available","dateValue":"2011-07-21"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-FI09095006.pdf","filesize":[{"value":"153.5 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"39"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"72b8918b-6942-444c-bd48-d59797891c51","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2009 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"池田, 雅紀"},{"creatorName":"小野, 真吾"},{"creatorName":"佐藤, 一誠"},{"creatorName":"吉田, 稔"},{"creatorName":"中川, 裕志"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Masaki, Ikeda","creatorNameLang":"en"},{"creatorName":"Shingo, Ono","creatorNameLang":"en"},{"creatorName":"Issei, Sato","creatorNameLang":"en"},{"creatorName":"Minoru, Yoshida","creatorNameLang":"en"},{"creatorName":"Hiroshi, 
Nakagawa","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10114171","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"教師なし学習によるクラスタリングに対して,半教師有り学習を適用する手法について提案する.クラスターの評価基準において,結果のクラスターにおける正解データの割合を表す適合率と正解データが結果のクラスターに含まれている割合を表す再現率が存在する.従来研究において,素性の種類を限定することによって特に高い適合率を持つクラスターを生成することが可能になった.これらの素性は疎であり,再現率を向上させることは困難である.一方,素性の中には,人物を識別する能力は弱いが,文書に含まれている数の多い素性が存在する.我々は半教師有り学習を適合率の高いクラスターに対して適用し,クラスターの再現率の向上させることを提案する.本研究では,ブートストラップ法として知られている Espresso を応用し,人名曖昧解消における半教師有り学習として用いる.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This research proposes the application of semi-supervised learning to unsupervised clustering. There are two criteria of cluster evaluation, or precision and recall. Precision is the ratio of true datas in the result cluster and recall is the ratio of true datas the result cluster has to all true data. In previous work, the selection of feature types enables to make high precision clusters, but these features are too sparse to improve recall. On the other hand, there are features that has poor discrimination capacity but are thick in the documents. We suggest to applicate semi-supervised learning to these high precision clusters and advance clusters' recall. 
In this research, we use Espresso that is bootstrap method in the information extraction for person name disambiguation as semi-supervised learning method.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"8","bibliographic_titles":[{"bibliographic_title":"研究報告情報学基礎(FI)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2009-07-21","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"6","bibliographicVolumeNumber":"2009-FI-95"}]},"relation_version_is_last":true,"weko_creator_id":"10"},"id":62572,"updated":"2025-01-22T02:33:44.562173+00:00","links":{},"created":"2025-01-18T23:24:30.186485+00:00"}