{"created":"2025-01-19T01:42:20.872020+00:00","updated":"2025-01-19T08:26:03.048856+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00238971","sets":["1164:1165:11462:11709"]},"path":["11709"],"owner":"44499","recid":"238971","title":["体系的推論における言語モデルの内部挙動の分析"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-09-04"},"_buckets":{"deposit":"a0743ae2-e98a-4c38-996b-6f403a8d19f7"},"_deposit":{"id":"238971","pid":{"type":"depid","value":"238971","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"体系的推論における言語モデルの内部挙動の分析","author_link":["654587","654585","654584","654586"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"体系的推論における言語モデルの内部挙動の分析"},{"subitem_title":"Analysis of the internal behavior of language models in systematic reasoning","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"4C","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2024-09-04","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"京都産業大学情報理工学部"},{"subitem_text_value":"京都産業大学情報理工学部"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Faculty of Information Science and Engineering, Kyoto Sangyo University","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Information Science and Engineering, Kyoto Sangyo University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/238971/files/IPSJ-DBS24179024.pdf","label":"IPSJ-DBS24179024.pdf"},"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-DBS24179024.pdf","filesize":[{"value":"3.4 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"13"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_login","version_id":"d83e66b2-e86b-4b13-b8a7-8ed173a99a7c","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"井上, 綾介"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"宮森, 恒"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Ryosuke, Inoue","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Hisashi, Miyamori","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10112482","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-871X","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"近年,言語モデルは人間のような流暢な言語生成能力を示している一方で,論理的な推論に関しては依然として未知の問題に汎化することが困難である.そこで本研究では,言語の体系性に着想を得て,言語モデルの汎化を目指す上で重要な要素を探るために命題論理に基づくデータセットを構築し,それを用いて言語モデルの内部挙動を分析する.具体的には,異なる形状の命題に対して汎化できるモデルとそうでないモデルの各ニューロンの活性化度合いを比較し,言語モデルの命題論理における体系性を担っていると考えられる箇所を特定する.実験では,パラメータ数の異なるデコーダモデルに対して分析し,その内部挙動を明らかにする.本研究により,言語モデルの分布外汎化を実現するための知見が得られることが期待される.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Large Language Models have achieved remarkable advancements in natural language processing tasks such as language generation and translation recently. On the other hand, their ability to solve unseen logical inference problems is still limited, and it is unclear which parts of the models have the capability to store acquired knowledge and skills to generalize. In this paper, we draw inspiration from the systematicity of language to explore crucial elements for generalizing language models. To this end, we utilize a propositional logic dataset to analyze the internal behavior of language models. Specifically, we compare the activation of neurons in models that can generalize to different forms of propositions with those that cannot, identifying areas believed to be responsible for the systematicity of propositional logic within the language model.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告データベースシステム(DBS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-09-04","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"24","bibliographicVolumeNumber":"2024-DBS-179"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":238971,"links":{}}