% Technical report: proposal of a system that automatically generates music
% videos by learning from existing content with a hidden Markov model.
% Cleanup applied to the auto-exported record:
%   - author: the export listed each person twice (Japanese script and
%     romanized), and the romanized forms had family/given names swapped.
%     The Japanese forms stay in author; the corrected romanized forms are
%     kept in the ignored field author-en.
%   - issue -> number, month uses the bare macro, abstract text moved out of
%     note (content unchanged) so it is not printed in the reference list.
% NOTE(review): the techreport type requires an institution field, which the
% export did not provide. The citation key suggests the IPSJ repository, but
% the issuing body is not stated in this record - confirm and add it.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00082459,
  author    = {大矢, 隼士 and 森島, 繁生},
  author-en = {Ohya, Hayato and Morishima, Shigeo},
  title     = {隠れマルコフモデルに基づく既存コンテンツ学習による音楽動画自動生成システムの提案},
  number    = {10},
  month     = may,
  year      = {2012},
  abstract  = {インターネットの動画共有サイト上に存在するアマチュア制作の音楽動画を再利用することにより，自動的に音楽動画を生成するシステムを提案する．この音楽動画は，既存の音楽にゲームやアニメなどの映像を切り貼りして制作されたものであり，MAD 動画と呼ばれている．本稿では，以前筆者らグループが提案した DanceReProducer の学習手法を，マルコフ連鎖を使うことにより映像の時系列情報を考慮できるように改善し，Forward Viterbi アルゴリズムを用いて動画生成をおこなう．提案システムは，まずインターネット上にアップロードされている MAD 動画を大量に取得し，データベースとする．その後，データベースの動画から音楽特徴量，映像特徴量を抽出し一小節ごとにまとめ，楽曲の構造情報やテンポの推定をおこなう．次に，各特徴量をクラスタリングし，状態変数を音楽特徴量，潜在変数を映像特徴量として，潜在変数のマルコフ連鎖モデルを使用して学習する．動画の生成は，任意の楽曲 （入力楽曲） に対し，学習した同調関係から最も入力楽曲と同調する映像をデータベースから選び出し，切り貼りすることで新しい動画を自動的に生成している．, We propose automatic music video creating system by reusing music videos that are created by amateur users and existed on the video sharing service. These music videos are created by combining existing music with frames of video games, anime, and so on and are called ”MAD” movie. In this paper, we improved learning method of DanceReProducer that is the system our group proposed previously, by considering time series information of videos by using Markov chain, and we automatically generated MAD movie by using Forward Viterbi algorithm. First, we get a lot of MAD movie from the web and makes database. Next, music feature and video feature are extracted from MAD movies in the database, and gathered per bar. Then, each feature is clustered and learned by Markov model of latent variable as state variable is music feature and latent variable is video feature. At last, movie is automatically generated by selecting video frame, which is most synchronized with input music in the database, and combining input music with video frames.}
}