% Technical report with a Japanese title and a bilingual (Japanese/English) abstract.
% The four authors are listed once, in Japanese; their romanized readings
% (surname first) are kept in `yomi`, which Japanese BibTeX styles use for
% sorting and which other styles ignore.
% NOTE(review): the techreport type requires an `institution` field and this
% record has none. The host in the citation key (ipsj.ixsq.nii.ac.jp) suggests
% IPSJ -- confirm against the repository record and add it.
% NOTE(review): `number` carries the exporter's combined value verbatim;
% presumably issue 3 of report series 1999-ICS-119 -- verify before splitting.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00050681,
  author   = {山本, 真也 and 山口, 文彦 and 斎藤, 博昭 and 中西, 正和},
  yomi     = {Yamamoto, Shinya and Yamaguchi, Fumihiko and Saito, Hiroaki and Nakanishi, Masakazu},
  title    = {強化学習における環境変化認識法},
  number   = {3(1999-ICS-119)},
  month    = jan,
  year     = {2000},
  abstract = {非マルコフ決定過程(non-MDP)の環境における強化学習の問題点の解決法として，環境変化時に何らかの処理を行う方法が提案されている．これらの研究において，環境変化の認識法は確立されていない．本論文では，non-MDPにおける有力な学習エンジンである確率的傾斜法において，学習中に環境変化を認識する方法を提案する．確率的傾斜法の内部変数Wの変化量を調べることにより環境変化を認識する．提案手法は確率的傾斜法が適用できる問題であれば簡単に内部に組み込むことのでき，環境変化の認識を行うことができる．シミュレーション実験により従来の手法の半分程度のステップで環境変化を認識できることを示す．, There are some methods that resolve problems of reinforcement learning in non Marokov Decision Process(non-MDP) environment on environment changes. The efficient method of recognizing environmental change has not yet been proposed. This paper proposes a method for recognizing environmental changes on Stochastic Gradient Ascent(SGA) which is a major learning engine in non-MDP environment. It uses the change of an internal variable W of SGA. Our method can be easily put in SGA and it is available for all SGA-applicable problems. We had a simulation to show the efficiency of our method and succeeded to reduce the recognition time to almost half of the conventional method.},
}