% Journal article record (repository export), cleaned up for use as a database entry:
%  - the export listed the author twice (Japanese script and a romanized form with the
%    name parts swapped); the romanized spelling is kept in the ignored field
%    author-romanized. NOTE(review): assumes both names denote the same person -- confirm.
%  - the numeric issue is stored in number, the month uses the predefined macro, and
%    the abstract lives in abstract (not note) so styles do not print it in the
%    reference list.
@article{oai:ipsj.ixsq.nii.ac.jp:00175956,
  author           = {金澤, 裕治},
  author-romanized = {Kanazawa, Yuzi},
  title            = {教師データが不足した環境での機械学習結果改善手法},
  journal          = {情報処理学会論文誌},
  volume           = {57},
  number           = {11},
  pages            = {2382--2391},
  year             = {2016},
  month            = nov,
  abstract         = {厳密解を求めるのが困難でヒューリスティクスによって解かれている問題で，計算機が熟練者を上回ることが困難なものが存在する．そのような問題において，ヒューリスティクス手法を多数のパラメータで制御できるようにしておき，そのパラメータを機械学習によりチューニングすることで，熟練者の判断を再現できれば，解法の性能向上が期待できる．そのために解決しなければならない課題の1つが，教師データの不足である．本論文では，教師データが不足した環境で学習結果に含まれる誤りを改善する強化学習類似手法を提案する．提案手法を将棋プログラムBonanza 6.0の機械学習テーブル改善に適用し，1回の適用でイロレーティングが平均25程度，繰り返し適用することで，最終的には150程度向上した．, There are some problems where human experts can produce better result than heuristics methods on computers. Performance of such heuristics methods may be improved significantly by machine learning on result by human experts. An issue that must be solved to make it possible is sample data shortage. This paper proposes a reinforcement-learning-like method to fix errors in machine learning result generated from insufficient sample data. The method was applied to refine parameters used by the shogi program Bonanza 6.0. Experimental results show that Elo rating of Bonanza 6.0 with refined parameters was improved by 150 points.},
}