{"links":{},"id":100930,"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00100930","sets":["5471:7431:7566"]},"path":["7566"],"owner":"11","recid":"100930","title":["Encouragement of Right Social Norms by Inverse Reinforcement Learning"],"pubdate":{"attribute_name":"公開日","attribute_value":"2014-04-15"},"_buckets":{"deposit":"210c37a2-7bc5-462a-bcf3-57200ef6e38d"},"_deposit":{"id":"100930","pid":{"type":"depid","value":"100930","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"Encouragement of Right Social Norms by Inverse Reinforcement Learning","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Encouragement of Right Social Norms by Inverse Reinforcement Learning"},{"subitem_title":"Encouragement of Right Social Norms by Inverse Reinforcement Learning","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[Special Issue on Multiagent-based Societal Systems] inverse reinforcement learning, social norms","subitem_subject_scheme":"Other"}]},"item_type_id":"5","publish_date":"2014-04-15","item_5_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Chiba University"},{"subitem_text_value":"Japan Maritime Self-Defense Force"}]},"item_5_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Chiba University","subitem_text_language":"en"},{"subitem_text_value":"Japan Maritime Self-Defense Force","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/100930/files/IPSJ-JIP2202026.pdf"},"date":[{"dateType":"Available","dateValue":"2016-04-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-JIP2202026.pdf","filesize":[{"value":"701.6 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"5"},{"tax":["include_tax"],"price":"0","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"2b4ccaac-dd4a-45e6-aab3-65106073ca06","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2014 by the Information Processing Society of Japan"}]},"item_5_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Sachiyo, Arai"},{"creatorName":"Kanako, Suzuki"}],"nameIdentifiers":[{}]}]},"item_5_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Sachiyo, Arai","creatorNameLang":"en"},{"creatorName":"Kanako, Suzuki","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_5_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA00700121","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_5_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-6652","subitem_source_identifier_type":"ISSN"}]},"item_5_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"This study is intended to encourage appropriate social norms among multiple agents. Effective norms, such as those emerging from sustained individual interactions over time, can make agents act cooperatively to optimize their performance. We introduce a “social learning” model in which agents mutually interact under a framework of the coordination game. Because coordination games have dual equilibria, social norms are necessary to make agents converge to a unique equilibrium. As described in this paper, we present the emergence of a right social norm by inverse reinforcement learning, which is an approach for extracting a reward function from the observation of optimal behaviors. First, we let a mediator agent estimate the reward function by inverse reinforcement learning from the observation of a master's behavior. Secondly, we introduce agents who act according to an estimated reward function in the multiagent world in which most agents, called citizens, have no way to act. Finally, we evaluate the effectiveness of introducing inverse reinforcement learning.","subitem_description_type":"Other"}]},"item_5_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This study is intended to encourage appropriate social norms among multiple agents. Effective norms, such as those emerging from sustained individual interactions over time, can make agents act cooperatively to optimize their performance. We introduce a “social learning” model in which agents mutually interact under a framework of the coordination game. Because coordination games have dual equilibria, social norms are necessary to make agents converge to a unique equilibrium. As described in this paper, we present the emergence of a right social norm by inverse reinforcement learning, which is an approach for extracting a reward function from the observation of optimal behaviors. First, we let a mediator agent estimate the reward function by inverse reinforcement learning from the observation of a master's behavior. Secondly, we introduce agents who act according to an estimated reward function in the multiagent world in which most agents, called citizens, have no way to act. Finally, we evaluate the effectiveness of introducing inverse reinforcement learning.","subitem_description_type":"Other"}]},"item_5_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"306","bibliographic_titles":[{"bibliographic_title":"Journal of information processing"}],"bibliographicPageStart":"299","bibliographicIssueDates":{"bibliographicIssueDate":"2014-04-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2","bibliographicVolumeNumber":"22"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-18T23:46:37.151772+00:00","updated":"2025-01-21T11:30:56.795430+00:00"}