{"updated":"2025-01-22T08:29:00.532400+00:00","links":{},"created":"2025-01-18T23:13:42.779983+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00048475","sets":["1164:4179:4229:4231"]},"path":["4231"],"owner":"1","recid":"48475","title":["機械学習を用いたタイ語の品詞タグづけ"],"pubdate":{"attribute_name":"公開日","attribute_value":"2001-09-10"},"_buckets":{"deposit":"5dbe8305-00b7-4626-bd28-c88263db06a4"},"_deposit":{"id":"48475","pid":{"type":"depid","value":"48475","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"機械学習を用いたタイ語の品詞タグづけ","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"機械学習を用いたタイ語の品詞タグづけ"},{"subitem_title":"POS Tagging in the Thai Language Using Machine - Learning Methods","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2001-09-10","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"独立行政法人通信総合研究所けいはんな情報通信融合研究センター"},{"subitem_text_value":"独立行政法人通信総合研究所けいはんな情報通信融合研究センター"},{"subitem_text_value":"独立行政法人通信総合研究所けいはんな情報通信融合研究センター"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Communications Research Laboratory","subitem_text_language":"en"},{"subitem_text_value":"Communications Research Laboratory","subitem_text_language":"en"},{"subitem_text_value":"Communications Research Laboratory","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/48475/files/IPSJ-NL01145007.pdf"},"date":[{"dateType":"Available","dateValue":"2003-09-10"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-NL01145007.pdf","filesize":[{"value":"1.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"23"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"d4b74795-9667-467a-bd1a-88480f385191","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2001 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"村田, 真樹"},{"creatorName":"馬青"},{"creatorName":"井佐原, 均"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Masaki, Murata","creatorNameLang":"en"},{"creatorName":"Ma, Qing","creatorNameLang":"en"},{"creatorName":"Hitoshi, Isahara","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10115061","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"われわれはこれまで,できるだけ少量の訓練データで実用的な品詞タグづけシステムを構築する目的で伸縮性入力ニューロタガー,ニューラルネットワークとBrillの誤り駆動学習を融合したハイブリッド型ニューロタガーを提案してきた。これらのタガーでは多品詞語を含む小規模タイ語コーパスを学習データとして,それぞれ94.4%,95.5%という高い精度(多品詞語のみを測定対象)で品詞のタグづけをした。本研究では,新たに決定リスト,最大エントロピー法,サポートベクトルマシン法の三つの機械学習法を用いるタイ語のタグづけの手法を提案し,それらを用いて品詞タグづけを行った。結果はサポートベクトルマシンがもっともよい精度(96.1%)を出し,さらにタイ語の品詞タグづけの精度向上を実現することになった。本稿では,手法間の比較や精度向上の原因についての考察も行なう。","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"The elastic-input neuro tagger and the hybrid neuro tagger combined the neural network and Brill's error-driven learning have already been proposed for the purpose of constructing a practical tagger that uses as little training data as possible. When a small Thai corpus is used for training, these taggers have tagging accuracies of 94.4% and 95.5% (accounting only for the ambiguous words in part of speech), respectively. In this study, we developed new tagging methods using the three machine learning methods: decision-list, maximum entropy, and support vector machine methods. We then performed tagging experiments using these methods. Our results showed that the support vector machine method has the best precision (96.1%), and that it is capable of improving the accuracy of tagging in the Thai language. Finally, we theoretically examined the above-mentioned methods and discussed how improvements have been made.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"50","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告自然言語処理(NL)"}],"bibliographicPageStart":"45","bibliographicIssueDates":{"bibliographicIssueDate":"2001-09-10","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"86(2001-NL-145)","bibliographicVolumeNumber":"2001"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"id":48475}