{"created":"2025-01-18T23:20:25.013201+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00057151","sets":["1164:5159:5192:5193"]},"path":["5193"],"owner":"1","recid":"57151","title":["DAEMアルゴリズムの話者・音声認識における有効性の検討"],"pubdate":{"attribute_name":"公開日","attribute_value":"2003-12-18"},"_buckets":{"deposit":"cc9ee44b-60ad-4397-b945-8a51f4f8d1c4"},"_deposit":{"id":"57151","pid":{"type":"depid","value":"57151","revision_id":0},"owners":[1],"status":"published","created_by":1},"item_title":"DAEMアルゴリズムの話者・音声認識における有効性の検討","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"DAEMアルゴリズムの話者・音声認識における有効性の検討"},{"subitem_title":"Deterministic Annealing EM algorithm for speaker and speech recognition","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2003-12-18","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"名古屋工業大学"},{"subitem_text_value":"名古屋工業大学"},{"subitem_text_value":"名古屋工業大学"},{"subitem_text_value":"名古屋大学"},{"subitem_text_value":"名古屋工業大学"},{"subitem_text_value":"名古屋工業大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Department of Computer Science and Engineering, Nagoya Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science and Engineering, Nagoya Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science and Engineering, Nagoya Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Media Science, Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science and Engineering, Nagoya Institute of Technology","subitem_text_language":"en"},{"subitem_text_value":"Department of Computer Science and Engineering, Nagoya Institute of 
Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/57151/files/IPSJ-SLP03049001.pdf"},"date":[{"dateType":"Available","dateValue":"2005-12-18"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP03049001.pdf","filesize":[{"value":"579.1 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"bb64b8dd-16d4-4ff0-bd22-f97cc9fd4db6","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2003 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"板谷, 洋平"},{"creatorName":"全, 炳河"},{"creatorName":"南角, 吉彦"},{"creatorName":"宮島, 千代美"},{"creatorName":"徳田, 恵一"},{"creatorName":"北村, 正"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Y., Itaya","creatorNameLang":"en"},{"creatorName":"H., Zen","creatorNameLang":"en"},{"creatorName":"Y., Nankaku","creatorNameLang":"en"},{"creatorName":"C., Miyajima","creatorNameLang":"en"},{"creatorName":"K., Tokuda","creatorNameLang":"en"},{"creatorName":"T., 
Kitamura","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"GMM(Gaussian Mixture Model)やHMM(Hidden Markov Model)のパラメータ推定には,広くEM(Expectation Maximization)アルゴリズムが用いられる.しかし,EMアルゴリズムは,推定結果が初期値設定に依存してしまうという,局所最適性の問題を有する.この問題に対処するためにDAEM(Deterministic Annealing Expectation Maximization)アルゴリズムが提案された.本稿では,このDAEMアルゴリズムをGMM,及び音素境界情報が得られない場合のHMMのパラメータ推定(フラットスタート)にそれぞれ適用し,GMMを用いた話者認識,及びHMMを用いた連続音声認識における有効性に関する検討を行う.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper investigates the effectiveness of a DAEM (Deterministic Annealing Expectation Maximization) algorithm for speaker and speech recognition. The EM (Expectation Maximization) algorithm is widely used for parameter estimation of statistical models. However, the EM algorithm has the problem of initialization dependence. To relax this problem, the DAEM algorithm has been proposed. 
In this paper, we apply the DAEM algorithm to estimate acoustic models for speaker recognition and continuous speech recognition.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"情報処理学会研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2003-12-18","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"124(2003-SLP-049)","bibliographicVolumeNumber":"2003"}]},"relation_version_is_last":true,"weko_creator_id":"1"},"id":57151,"updated":"2025-01-22T04:36:29.166946+00:00","links":{}}