{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00055779","sets":["1164:5064:5071:5074"]},"path":["5074"],"owner":"1","recid":"55779","title":["歌声GMMとビタビ探索を用いた多重奏中のボーカルパートに限定した基本周波数推定手法"],"pubdate":{"attribute_name":"公開日","attribute_value":"2007-08-02"},"_buckets":{"deposit":"81eabbae-fef9-498b-8b24-f1e86893c35c"},"_deposit":{"id":"55779","pid":{"type":"depid","value":"55779","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"歌声GMMとビタビ探索を用いた多重奏中のボーカルパートに限定した基本周波数推定手法","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"歌声GMMとビタビ探索を用いた多重奏中のボーカルパートに限定した基本周波数推定手法"},{"subitem_title":"An F0 estimation method for detecting vocal part in polyphonic music by using vocal GMM and Viterbi search ","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2007-08-02","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"産業技術総合研究所"},{"subitem_text_value":"産業技術総合研究所"},{"subitem_text_value":"京都大学大学院情報学研究科知能情報学専攻"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"National Institute of Advanced Industrial Science and Technology (AIST)","subitem_text_language":"en"},{"subitem_text_value":"National Institute of Advanced Industrial Science and Technology (AIST)","subitem_text_language":"en"},{"subitem_text_value":"Dept. 
of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/55779/files/IPSJ-MUS07071020.pdf"},"date":[{"dateType":"Available","dateValue":"2009-08-02"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS07071020.pdf","filesize":[{"value":"821.0 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"1157cf71-c251-4666-80f8-4e712e57a8cf","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2007 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"藤原弘将"},{"creatorName":"後藤, 真孝"},{"creatorName":"奥乃, 博"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"HIROMASA, FUJIHARA","creatorNameLang":"en"},{"creatorName":"MASATAKA, GOTO","creatorNameLang":"en"},{"creatorName":"HIROSHI, 
G.OKUNO","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,混合音中のボーカルパートの基本周波数(F0)を推定する手法について述べる.ボーカルパートは多くのジャンルの音楽で主要な役割を果たしており,ボーカルパートのF0推定は様々な用途に応用出来る.我々は,確率的定式化により,ボーカルパートのF0推定の問題を多重ピッチ解析問題と音源(歌声かどうか)認識問題に帰着させる.音源認識問題は,歌声/非歌声を表現する混合ガウス分布(GMM)を用いて,歌声確率を計算することで実現する.最後に,これらの確率的問題を最大化するF0の系列をビタビアルゴリズムによって推定する.評価実験により,F0推定精度が75.4%から 78.3%に向上し,誤り率を13.8%削減することを確認した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper describes a method for estimating F0s of vocal part from polyphonic audio signals. Because melody is sung by a singer in many musical pieces, the estimation of F0s of the vocal part is useful for many applications. We separate the problem of estimating F0s of vocal into multiple-F0 estimation problem and sound source (vocal or not) recognition problem. To deal with the sound source recognition problem, we evaluate the vocal probability by using vocal and non-vocal Gaussian mixture models (GMMs). Finally, we estimate an F0 trajectory that maximize these stochastic problems, based on Viterbi search. Experimental results show that our method improves estimation accuracy from 75.4% to 78.3%, which is 13.8% reduction of misestimation. 
","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"126","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"119","bibliographicIssueDates":{"bibliographicIssueDate":"2007-08-02","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"81(2007-MUS-071)","bibliographicVolumeNumber":"2007"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"id":55779,"updated":"2025-01-22T05:17:41.799602+00:00","links":{},"created":"2025-01-18T23:19:20.876192+00:00"}