{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00074033","sets":["1164:4179:6308:6410"]},"path":["6410"],"owner":"10","recid":"74033","title":["機械学習による近代文語文への濁点の自動付与"],"pubdate":{"attribute_name":"公開日","attribute_value":"2011-05-09"},"_buckets":{"deposit":"f5657782-c76a-4d39-96f2-96778f40b2b8"},"_deposit":{"id":"74033","pid":{"type":"depid","value":"74033","revision_id":0},"owners":[10],"status":"published","created_by":10},"item_title":"機械学習による近代文語文への濁点の自動付与","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"機械学習による近代文語文への濁点の自動付与"},{"subitem_title":"A Machine Learning Approach to Automatic Labeling of Voiced Consonants for Modern Japanese Literary Text","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"学生セッション(1)","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2011-05-09","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"奈良先端科学技術大学院大学"},{"subitem_text_value":"奈良先端科学技術大学院大学"},{"subitem_text_value":"国立国語研究所"},{"subitem_text_value":"奈良先端科学技術大学院大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Nara Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"Nara Institute of Science and Technology","subitem_text_language":"en"},{"subitem_text_value":"National Institute for Japanese Language and Linguistics","subitem_text_language":"en"},{"subitem_text_value":"Nara Institute of Science and Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/74033/files/IPSJ-NL11201006.pdf"},"date":[{"dateType":"Available","dateValue":"2013-05-09"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-NL11201006.pdf","filesize":[{"value":"776.5 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"23"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"83bc7dd6-2d6e-4d46-a457-2c9d67f536e5","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2011 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"岡, 照晃"},{"creatorName":"小町, 守"},{"creatorName":"小木曽, 智信"},{"creatorName":"松本, 裕治"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Teruaki, Oka","creatorNameLang":"en"},{"creatorName":"Mamoru, Komachi","creatorNameLang":"en"},{"creatorName":"Toshinobu, Ogiso","creatorNameLang":"en"},{"creatorName":"Yuji, Matsumoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10115061","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"現代日本語のように,濁音を仮名で表記する際に必ず濁点を用いる習慣が定着したのは明治時代以降のことで,明治期の文献の中では濁音が期待される文字に濁点のない濁点無表記の場合が多い.本論文では,濁点無表記の濁音仮名文字を識別し,自動で濁点を補う手法について述べる.我々は,判定点の文字が濁点無表記文字か否かを決定する2値分類問題として定式化を行った.提案手法では,周辺文字列の情報のみを用いて点推定を行う.オンライン学習を採用し,大規模な『太陽コーパス』から学習を行なった.これにより提案手法は,『国民之友』において96.016%の精度と98.283%の再現率を達成した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"The present-day Japanese use of voiced consonant mark had established in Meiji Era. Thus, modern Japanese literary text written in Meiji Era often lacks compulsory voiced consonant marks. In this paper, we propose an approach to automatic labeling of voiced consonants for modern Japanese literary language. We formulate the task of labeling voiced consonants into binary classification problem. Our method uses as its feature set only surface information about the surrounding character strings with pointwise prediction. We use an online learning method for exploiting large datasets from Taiyo Corpus. We achieve 96.016% precision and 98.283% recall on the Kokumin_no_tomo Corpus.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"8","bibliographic_titles":[{"bibliographic_title":"研究報告自然言語処理(NL)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2011-05-09","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"6","bibliographicVolumeNumber":"2011-NL-201"}]},"relation_version_is_last":true,"weko_creator_id":"10"},"id":74033,"updated":"2025-01-21T21:43:14.813334+00:00","links":{},"created":"2025-01-18T23:31:44.282786+00:00"}