@techreport{oai:ipsj.ixsq.nii.ac.jp:00194829,
  author           = {森住, 哲也},
  author-romanized = {Morizumi, Tetsuya},
  title            = {情報理論的尺度に基づく家族的類似クラスターの順序関係の学習可能性について-{Bayesian}逆強化学習の報酬を家族的類似度と見做すこととは何か-},
  number           = {20},
  month            = feb,
  year             = {2019},
  abstract         = {本論文では，＜私＞という視点を人工知能的システムに組み込むアプローチを示す．「それぞれの＜私＞が他者性を如何に解釈するか」という問いに対し，ウイトゲンシュタインの言語ゲームに於ける家族的類似の概念と世阿弥の離見の見の概念を確率モデルによって設計する．確率変数としての存在者は家族的類似として現れる．しかし一方で，その存在者はプレオーダーのテクストの族から全順序のテクストのクラスターへと再構築されなければならない．そのための必要条件は次に示される：「テクストの家族的類似のクラスターの境界となる確率変数の確率分布を学習させる過程」，即ち「順序関係の公理にしたがう決定論的なテクストのあつまりを生成する過程」が確率的に分析される．それにより大量のテクストから家族的類似を満たす順序関係の規則を抽出する．即ち，半順序関係，全順序関係の性質を持つテクストのクラスターが分析されることによって確率的世界から決定の世界の順序関係が導かれる．確率分布の家族的類似は情報理論的尺度の順序関係によって評価される．本論文では，私の意思を示す教師データを使用する，教師ありベイジアン逆強化学習 (Supervised Bayesian Inverse Reinforcement Learning (S-BIRL)) のグラフィカルモデルを示す．S-BIRL は Blei の supervised LDA の潜在的確率変数を強化学習のアクションの潜在的なパラメーターと解釈し，かつ Ramage の Labeled LDA を強化学習の状態 S のラベルとして解釈するモデルである．
                      In this paper, we present an approach to incorporate the viewpoint of ＜I＞ into an artificial intelligent system. To the question "How each mind interprets others'", "family resemblance" in Wittgenstein's language game and concepts of "Riken-no-ken (sight outside of sight)" used in Ze'ami's treatise on Noh are designed by probabilistic models. Those who exist as stochastic variables appear as family resemblance. But on the other hand, its existence must be reconstructed from the pre-order text group to the total order cluster. The requirements for this are as follows: "The process of learning the probability distribution of the random variable that becomes the boundary of the familial resemblance clusters of texts", that is, "the process of generating a set of deterministic texts that satisfies the axiom of order relation" is stochastically analyzed. It extracts rules of order relation satisfying the familial resemblance from a large amount of text. That is, by analyzing clusters of texts having partial-order relation and total-order relationship property, the order relation of decision world is derived from stochastic world. Family similarity of probability distribution is evaluated by order relation of information theoretic scale. In this paper, we show a graphical model of Supervised Bayesian Inverse Reinforcement Learning (S-BIRL) using supervised data. S-BIRL is a model that interprets the potential random variable of Blei's supervised LDA as a potential parameter of reinforcement learning actions and interprets Ramage's Labeled LDA as a label of reinforcement learning state S.},
  internal-note    = {NOTE(review): the required techreport field "institution" is absent from the exported record; the key suggests an IPSJ repository export -- confirm the issuing body and add it. The token "＜I＞" in the English abstract was restored from the Japanese "＜私＞" after the export dropped it -- confirm against the published abstract.},
}