{"created":"2025-01-19T01:36:01.454942+00:00","updated":"2025-01-19T09:49:50.577670+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00234275","sets":["581:11492:11498"]},"path":["11498"],"owner":"44499","recid":"234275","title":["二人零和ゲームにおける突然変異駆動型正則化先導者追従法の終極反復収束"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-05-15"},"_buckets":{"deposit":"a167543b-d16e-4d2a-a15f-aa270f30da82"},"_deposit":{"id":"234275","pid":{"type":"depid","value":"234275","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"二人零和ゲームにおける突然変異駆動型正則化先導者追従法の終極反復収束","author_link":["638199","638198","638195","638194","638193","638200","638196","638197"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"二人零和ゲームにおける突然変異駆動型正則化先導者追従法の終極反復収束"},{"subitem_title":"Mutation-driven Follow the Regularized Leader for Last-iterate Convergence in Zero-sum Games","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[一般論文(推薦論文)] 終極反復収束,正則化先導者追従法,零和ゲーム,突然変異付きレプリケータダイナミクス","subitem_subject_scheme":"Other"}]},"item_type_id":"2","publish_date":"2024-05-15","item_2_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"株式会社サイバーエージェント/電気通信大学"},{"subitem_text_value":"電気通信大学"},{"subitem_text_value":"電気通信大学"},{"subitem_text_value":"電気通信大学"}]},"item_2_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"CyberAgent, Inc. / The University of Electro-Communications","subitem_text_language":"en"},{"subitem_text_value":"The University of Electro-Communications","subitem_text_language":"en"},{"subitem_text_value":"The University of Electro-Communications","subitem_text_language":"en"},{"subitem_text_value":"The University of Electro-Communications","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/234275/files/IPSJ-JNL6505010.pdf","label":"IPSJ-JNL6505010.pdf"},"date":[{"dateType":"Available","dateValue":"2026-05-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-JNL6505010.pdf","filesize":[{"value":"1.2 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"8"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"e00706d1-d8e7-487c-854c-938a2b665ba9","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_2_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"阿部, 拳之"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"豊島, 健太郎"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"坂本, 充生"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"岩崎, 敦"}],"nameIdentifiers":[{}]}]},"item_2_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Kenshi, Abe","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kentaro, Toyoshima","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Mitsuki, Sakamoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Atsushi, Iwasaki","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_2_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN00116647","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_2_publisher_15":{"attribute_name":"公開者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"item_2_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7764","subitem_source_identifier_type":"ISSN"}]},"item_2_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本研究では,二人零和ゲームにおける正則化先導者追従法(Follow the Regularized Leader,FTRL)に突然変異を導入した学習アルゴリズムの帰結を吟味する.FTRLは,戦略の時間平均がナッシュ均衡に収束することが保証されているアルゴリズムのクラスである.しかし,その多くは周回軌道に陥ってしまい,均衡に直接収束しないことが知られている.そこで本研究では,進化ゲームの文脈でよく用いられる突然変異付きレプリケータダイナミクスと等価なやり方で,突然変異を利用したMutant FTRL(M-FTRL)を提案する.次いでM-FTRLの連続時間ダイナミクスを分析し,ナッシュ均衡に近似する定常点に向けての強い収束性を保証した.さらに,M-FTRLの突然変異項に含まれる参照戦略(reference strategy)を適宜更新することで,近似でない厳密なナッシュ均衡への直接収束(終極反復収束)を保証した.","subitem_description_type":"Other"}]},"item_2_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This study considers a variant of the Follow the Regularized Leader (FTRL) dynamics in two-player zero-sum games. FTRL is guaranteed to converge to a Nash equilibrium when time-averaging the strategies. At the same time, a lot of variants suffer from the issue of limit cycling behavior, i.e., lack the last-iterate convergence guarantee. To this end, we propose the mutant FTRL (M-FTRL) algorithm that introduces mutation to perturb action probabilities. We then investigate the continuous-time dynamics of M-FTRL and provide strong convergence guarantees toward stationary points that approximate a Nash equilibrium. Furthermore, by updating the reference strategy of the mutation term in M-FTRL, we ensure the last-iterate convergence to an exact Nash equilibrium. ","subitem_description_type":"Other"}]},"item_2_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"979","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌"}],"bibliographicPageStart":"968","bibliographicIssueDates":{"bibliographicIssueDate":"2024-05-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"5","bibliographicVolumeNumber":"65"}]},"relation_version_is_last":true,"item_2_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.20729/00234158","subitem_identifier_reg_type":"JaLC"}]},"weko_creator_id":"44499"},"id":234275,"links":{}}