{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00213444","sets":["6164:6165:6210:10734"]},"path":["10734"],"owner":"44499","recid":"213444","title":["Improve Counterfactual Regret Minimization Agents Training by Setting Limitations of Numbers of Steps in Games"],"pubdate":{"attribute_name":"公開日","attribute_value":"2021-11-06"},"_buckets":{"deposit":"fd2e6037-6ee6-43f1-9a21-eaa41a2e0787"},"_deposit":{"id":"213444","pid":{"type":"depid","value":"213444","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"Improve Counterfactual Regret Minimization Agents Training by Setting Limitations of Numbers of Steps in Games","author_link":["546174","546171","546173","546172"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Improve Counterfactual Regret Minimization Agents Training by Setting Limitations of Numbers of Steps in Games"},{"subitem_title":"Improve Counterfactual Regret Minimization Agents Training by Setting Limitations of Numbers of Steps in Games","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"Imperfect Information Games","subitem_subject_scheme":"Other"},{"subitem_subject":"Counterfactual Regret Minimization","subitem_subject_scheme":"Other"},{"subitem_subject":"Abstraction technique","subitem_subject_scheme":"Other"},{"subitem_subject":"Curriculum Learning","subitem_subject_scheme":"Other"},{"subitem_subject":"Card Game Cheat","subitem_subject_scheme":"Other"}]},"item_type_id":"18","publish_date":"2021-11-06","item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_18_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Arts and Sciences, the University of Tokyo"},{"subitem_text_value":"Graduate School of Arts and Sciences, the University of Tokyo"}]},"item_18_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Arts and Sciences, the University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Arts and Sciences, the University of Tokyo","subitem_text_language":"en"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/213444/files/IPSJ-GPWS2021023.pdf","label":"IPSJ-GPWS2021023.pdf"},"date":[{"dateType":"Available","dateValue":"2021-11-06"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-GPWS2021023.pdf","filesize":[{"value":"948.3 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"5"},{"tax":["include_tax"],"price":"0","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"18"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"5fc58457-1ade-46f6-8656-6bb6705863ff","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2021 by the Information Processing Society of Japan"}]},"item_18_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Cheng, Yi"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tomoyuki, Kaneko"}],"nameIdentifiers":[{}]}]},"item_18_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Cheng, Yi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tomoyuki, Kaneko","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_5794","resourcetype":"conference paper"}]},"item_18_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"Counterfactual Regret Minimization (CFR) has been one of the most famous algorithms to learn decent strategies of imperfect information games. Because CFR requires traversing the whole or part of game tree every iteration, it is infeasible to handle games with repetition where the game tree is not finite. In this paper, we introduce two abstraction techniques, one of which is to make the game tree finite and the other one is to reduce the size of game trees. Our experiments are conducted in an imperfect information card game called Cheat and we introduce the notion of “Health Points” a player has in each game to make the game length finite thus easier to handle. We utilize the information sets abstraction technique to speed up the training and evaluate how results from smaller games can improve training in larger ones. We also show Ordered Abstraction can help us increase the learning efficiency of specific agents.","subitem_description_type":"Other"}]},"item_18_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Counterfactual Regret Minimization (CFR) has been one of the most famous algorithms to learn decent strategies of imperfect information games. Because CFR requires traversing the whole or part of game tree every iteration, it is infeasible to handle games with repetition where the game tree is not finite. In this paper, we introduce two abstraction techniques, one of which is to make the game tree finite and the other one is to reduce the size of game trees. Our experiments are conducted in an imperfect information card game called Cheat and we introduce the notion of “Health Points” a player has in each game to make the game length finite thus easier to handle. We utilize the information sets abstraction technique to speed up the training and evaluate how results from smaller games can improve training in larger ones. We also show Ordered Abstraction can help us increase the learning efficiency of specific agents.","subitem_description_type":"Other"}]},"item_18_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"123","bibliographic_titles":[{"bibliographic_title":"ゲームプログラミングワークショップ2021論文集"}],"bibliographicPageStart":"117","bibliographicIssueDates":{"bibliographicIssueDate":"2021-11-06","bibliographicIssueDateType":"Issued"},"bibliographicVolumeNumber":"2021"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":213444,"updated":"2025-01-19T17:09:36.351488+00:00","links":{},"created":"2025-01-19T01:14:19.319709+00:00"}