{"updated":"2025-01-22T23:32:19.583895+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00017085","sets":["934:989:994:995"]},"path":["995"],"owner":"1","recid":"17085","title":["強化学習エージェントによる協調行動とコミュニケーションの創発"],"pubdate":{"attribute_name":"公開日","attribute_value":"2007-12-15"},"_buckets":{"deposit":"6088f24f-7d86-459f-92e8-f034dad55ec7"},"_deposit":{"id":"17085","pid":{"type":"depid","value":"17085","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"強化学習エージェントによる協調行動とコミュニケーションの創発","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"強化学習エージェントによる協調行動とコミュニケーションの創発"},{"subitem_title":"Emergence of Communication and Cooperative Behavior by Reinforcement Learning Agents","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"シンポジウム特集","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2007-12-15","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"独立行政法人沖縄科学技術研究基盤整備機構大学院大学先行研究プロジェクト 現在,独立行政法人国立高等専門学校機構沖縄工業高等専門学校メディア情報工学科"},{"subitem_text_value":"独立行政法人沖縄科学技術研究基盤整備機構大学院大学先行研究プロジェクト"},{"subitem_text_value":"独立行政法人沖縄科学技術研究基盤整備機構大学院大学先行研究プロジェクト"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Initial Research Project (IRP), Okinawa Institute of Science and Technology (OIST) Promotion Corporation, Presently with Media Information Engineering, Okinawa National College of Technology (ONCT)","subitem_text_language":"en"},{"subitem_text_value":"Initial Research Project (IRP), Okinawa Institute of Science and Technology (OIST) Promotion Corporation","subitem_text_language":"en"},{"subitem_text_value":"Initial Research Project (IRP), Okinawa Institute of Science and Technology (OIST) Promotion Corporation","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/17085/files/IPSJ-TOM4819007.pdf"},"date":[{"dateType":"Available","dateValue":"2009-12-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TOM4819007.pdf","filesize":[{"value":"2.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"17"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"6e3d9a95-f5eb-4fab-a459-39359127718d","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2007 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"佐藤尚"},{"creatorName":"内部, 英治"},{"creatorName":"銅谷, 賢治"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takashi, Sato","creatorNameLang":"en"},{"creatorName":"Eiji, Uchibe","creatorNameLang":"en"},{"creatorName":"Kenji, Doya","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11464803","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7780","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"コミュニケーションの原型は,個体が環境や他の個体との相互作用において,報酬の獲得や適応度の向上に寄与する形で発現したと考えられる.本研究では,報酬最大化を目的とする強化学習エージェントが,余剰な行動と感覚の自由度をコミュニケーションのために使うことを学習できるための条件を,2個体が互いに相手の縄張りに入ると報酬を得るが衝突すると罰を受けるというゲームにより検証した.このゲームでは,コミュニケーションと協調行動のそれぞれが必須ではないが,発光行動を使えるエージェント間では,互いにその光を信号として利用することで衝突を避け,報酬を獲得し合う協調行動の創発が観察された.信号の表現の仕方には多様性が見られ,また作業記憶を持つエージェント間では,信号を送る側とそれに従う側という役割分化も見られた.これは,コミュニケーションと協調行動が必須ではない状況において,意味と信号の任意の対応付けによるコミュニケーションが,コミュニケーションの達成そのものを目的としなくても一般的な行動学習の枠組みにより創発しうることを示す初めての知見である.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"The prototype of symbolic communication would have emerged to help individuals to earn rewards and to improve fitness by using their excess degrees of freedom in action and perception. In this paper, we investigate whether and how reinforcement learning agents who aim at maximizing rewards can learn to use their redundant actions for communication in a simple game where the two agents learn to earn rewards by intruding into the other's territory on a linear track. In this task, although both cooperation and communication are not imperative, we found that the agents with lights and light sensors are able to achieve cooperative behaviors by avoiding collisions using visual communication in the middle of the track. Further analysis reveals a variety in the mapping of messages to signals. In some cases, the differentiation of roles into a sender and a receiver was observed. This is to our knowledge the first demonstration of emergence of communication by arbitrary meaning-coding mapping without an explicit objective of communication itself in a situation in which both cooperation and communication are not indispensable.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"67","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌数理モデル化と応用(TOM)"}],"bibliographicPageStart":"55","bibliographicIssueDates":{"bibliographicIssueDate":"2007-12-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"SIG19(TOM19)","bibliographicVolumeNumber":"48"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"created":"2025-01-18T22:50:10.690470+00:00","id":17085,"links":{}}