{"updated":"2025-01-19T19:31:57.693990+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00206112","sets":["1164:4179:10245:10269"]},"path":["10269"],"owner":"44499","recid":"206112","title":["BERTの教師無しデータへの適用"],"pubdate":{"attribute_name":"公開日","attribute_value":"2020-06-26"},"_buckets":{"deposit":"ba483825-f8ba-4479-a2b0-d6726060c93b"},"_deposit":{"id":"206112","pid":{"type":"depid","value":"206112","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"BERTの教師無しデータへの適用","author_link":["511765","511764","511766","511773","511776","511771","511772","511769","511774","511779","511775","511777","511767","511778","511768","511770"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"BERTの教師無しデータへの適用"},{"subitem_title":"Application of BERT to Unsupervised Data","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2020-06-26","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"テンソル・コンサルティング株式会社"},{"subitem_text_value":"テンソル・コンサルティング株式会社"},{"subitem_text_value":"テンソル・コンサルティング株式会社"},{"subitem_text_value":"テンソル・コンサルティング株式会社"},{"subitem_text_value":"三菱重工業株式会社ICTソリューション本部EPI部"},{"subitem_text_value":"三菱重工業株式会社ICTソリューション本部EPI部"},{"subitem_text_value":"三菱重工業株式会社ICTソリューション本部EPI部"},{"subitem_text_value":"三菱重工業株式会社バリューチェーン本部プロジェクト部"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Tensor Consulting Co.Ltd.","subitem_text_language":"en"},{"subitem_text_value":"Tensor Consulting Co.Ltd.","subitem_text_language":"en"},{"subitem_text_value":"Tensor Consulting Co.Ltd.","subitem_text_language":"en"},{"subitem_text_value":"Tensor Consulting Co.Ltd.","subitem_text_language":"en"},{"subitem_text_value":"EPI Department/ICT Solution Headquarters/Mitsubishi Heavy Industries, Ltd.","subitem_text_language":"en"},{"subitem_text_value":"EPI Department/ICT Solution Headquarters/Mitsubishi Heavy Industries, Ltd.","subitem_text_language":"en"},{"subitem_text_value":"EPI Department/ICT Solution Headquarters/Mitsubishi Heavy Industries, Ltd.","subitem_text_language":"en"},{"subitem_text_value":"Project Department/Value Chain Headquarters/Mitsubishi Heavy Industries, Ltd.","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/206112/files/IPSJ-NL20244004.pdf","label":"IPSJ-NL20244004.pdf"},"date":[{"dateType":"Available","dateValue":"2022-06-26"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-NL20244004.pdf","filesize":[{"value":"1.2 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"23"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"a4900b61-83c2-474f-a833-57720373df1e","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2020 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"築地, 毅"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"鈴木, 晴也"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"柴原, 一友"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"藤本, 浩司"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"池田, 龍司"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"尾﨑, 和基"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"森田, 克明"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"松原, 敬信"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Tsuyoshi, Tsukiji","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Haruya, Suzuki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kazutomo, Shibahara","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Koji, Fujimoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Ryuji, Ikeda","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kazuki, Ozaki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Katsuaki, Morita","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Takanobu, Matsubara","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10115061","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8779","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,BERT を利用した教師無しデータへの適用について論ずる.近年ディープラーニングの技術が確立し始めており,特に画像認識分野において,既存の技術では困難だった特徴の自動抽出を実現したことにより,非常に高い精度を上げるようになってきている.自然言語処理においてもディープラーニングの研究は広く行われているが,近年 Google により発表された BERT の功績は大きく,教師あり学習のタスクに対して,既存の成果を大きく上回る成果を上げている.本稿では,教師あり学習の精度を大きく高めた BERT を教師無しデータに適用することで,既存手法の性能向上につながる可能性があるという仮説を主張する.本稿では,特許文書を対象に,教師あり学習を行わずに特許の類似性を図る実験を行った.実験の結果,人手で付与した特許分類フラグに対し 61.9 %の正解率となり,BERT を活用することで教師データを与えずとも,特許の類似度を表現できることを示した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In this paper, we discuss application of documents to unsupervised data using BERT. In recent years, the technology of deep learning had begun to be established, and in the field of image recognition, the automatic extraction of features that was difficult with existing technologies has led to very high accuracy. Deep learning has been widely studied in natural language processing, but in recent years, BERT, by Google, has achieved a great deal of success and has far exceeded the existing achievements for supervised learning tasks. In this paper, we assert that applying BERT, which greatly improves the accuracy of supervised learning, to unsupervised data may lead to better performance than existing methods. We did an experiment on similarity of patents for patent documents without supervised learning. As a result, the accuracy rate was 61.9% for the manually assigned patent classification flag, and it was shown that the similarity of patents could be expressed without using training data by using BERT.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"7","bibliographic_titles":[{"bibliographic_title":"研究報告自然言語処理(NL)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2020-06-26","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4","bibliographicVolumeNumber":"2020-NL-244"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"created":"2025-01-19T01:08:12.500113+00:00","id":206112,"links":{}}