% Technical report no. 38, dated June 2015.
% The citation key is kept exactly as exported so existing citations still resolve.
% NOTE(review): author and institution are stored as UTF-8 text; this presumably
% needs a Unicode-aware toolchain (e.g. biblatex + Biber) -- confirm before use
% with classic 8-bit BibTeX.
@techreport{weko_142439_1,
  author      = {内部, 英治},
  title       = {How do we define the reward in reinforcement learning?},
  institution = {沖縄科学技術大学院大学神経計算ユニット},
  number      = {38},
  year        = {2015},
  month       = jun,
}