{"updated":"2025-01-23T01:03:26.298081+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00013848","sets":["581:755:760"]},"path":["760"],"owner":"1","recid":"13848","title":["人名のかな表記のゆれに基づく近似文字列照合法"],"pubdate":{"attribute_name":"公開日","attribute_value":"1995-08-15"},"_buckets":{"deposit":"3b7afa2a-169d-4529-bdc3-bb7bbf5a21d2"},"_deposit":{"id":"13848","pid":{"type":"depid","value":"13848","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"人名のかな表記のゆれに基づく近似文字列照合法","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"人名のかな表記のゆれに基づく近似文字列照合法"},{"subitem_title":"Approximate String Matching Based on Kana Variants of Names","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"論文","subitem_subject_scheme":"Other"}]},"item_type_id":"2","publish_date":"1995-08-15","item_2_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"NTT情報通信研究所知的情報処理研究部"},{"subitem_text_value":"豊橋技術科学大学情報工学系"}]},"item_2_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Intelligent Information Systems Laboratory, NTT Information and Communication Systems Laboratories","subitem_text_language":"en"},{"subitem_text_value":"Department of Information and Computer Sciences, Toyohashi University of Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/13848/files/IPSJ-JNL3608016.pdf"},"date":[{"dateType":"Available","dateValue":"1997-08-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-JNL3608016.pdf","filesize":[{"value":"1.2 
MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"8"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"de458249-d6b7-43e3-8202-bb9f8470dfbc","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 1995 by the Information Processing Society of Japan"}]},"item_2_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"高橋, 克巳"},{"creatorName":"梅村, 恭司"}],"nameIdentifiers":[{}]}]},"item_2_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Katsumi, Takahashi","creatorNameLang":"en"},{"creatorName":"Kyoji, Umemura","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_2_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN00116647","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_2_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7764","subitem_source_identifier_type":"ISSN"}]},"item_2_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"日本人名のかな表記にゆれとよばれる変形が存在し、日本語情報検索システムの問題となっている。本論文では人名のかな表記にゆれが存在してももれのない検索を可能とする近似文字列照合法を提案する。ゆれの問題に対処するためには表記を統一して検索を行うことが一般的であるが、現在かな表記を統一する基準は明らかではなく、そのため統一すべきゆれが多種になった場合の対策も明らかになっていない。本文では日本人名約3 000万件を解析し、姓のゆれのデータを収集分析する。その結果、姓は9万種の姓のゆれ単位に分類できること、実データ上で58%の姓に何らかのゆれが存在すること、ゆれの原因は連濁などの接続部の変化が大部分を占めることを明らかにする。さらにこのゆれの関係に基づいた正規化による照合を提案する。すなわち、実際にすべてのゆれを21 276組の文字列の等式関係で記述し、そこから自動的に15 
841の正規化規則を作成して照合する方法を提案する。この正規化規則を使った照合法を人名の分布にしたがった検索に適用し、再現率と適合率の観点から評価を行った。その結果、93%の適合率を達成したうえで、完全一致検索では1検索あたり15%存在していたゆれによる検索もれを解消した。人名についてかな表記のゆれが存在してももれのない検索が可能となった。","subitem_description_type":"Other"}]},"item_2_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"1915","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌"}],"bibliographicPageStart":"1906","bibliographicIssueDates":{"bibliographicIssueDate":"1995-08-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"8","bibliographicVolumeNumber":"36"}]},"relation_version_is_last":true,"item_2_alternative_title_2":{"attribute_name":"その他タイトル","attribute_value_mlt":[{"subitem_alternative_title":"情報検索"}]},"weko_creator_id":"1"},"created":"2025-01-18T22:47:49.548325+00:00","id":13848,"links":{}}