{"id":80409,"updated":"2025-01-21T19:49:10.393939+00:00","links":{},"created":"2025-01-18T23:34:53.629220+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00080409","sets":["1164:5064:6681:6682"]},"path":["6682"],"owner":"11","recid":"80409","title":["特徴空間における長時間スペクトル変動成分の識別学習"],"pubdate":{"attribute_name":"公開日","attribute_value":"2012-01-27"},"_buckets":{"deposit":"151a564b-fe07-4c62-84df-773ab24c7e1b"},"_deposit":{"id":"80409","pid":{"type":"depid","value":"80409","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"特徴空間における長時間スペクトル変動成分の識別学習","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"特徴空間における長時間スペクトル変動成分の識別学習"},{"subitem_title":"Feature-space Discriminative Training for Long-term spectro-temporal Features","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"学習・支援","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2012-01-27","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"日本アイ・ビー・エム株式会社東京基礎研究所"},{"subitem_text_value":"日本アイ・ビー・エム株式会社東京基礎研究所"},{"subitem_text_value":"日本アイ・ビー・エム株式会社東京基礎研究所"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"IBM Research - Tokyo, IBM Japan, Ltd.","subitem_text_language":"en"},{"subitem_text_value":"IBM Research - Tokyo, IBM Japan, Ltd.","subitem_text_language":"en"},{"subitem_text_value":"IBM Research - Tokyo, IBM Japan, Ltd.","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/80409/files/IPSJ-MUS12094021.pdf"},"date":[{"dateType":"Available","dateValue":"2014-01-27"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS12094021.pdf","filesize":[{"value":"521.1 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"35de3216-68e9-49fa-b5a4-7150ec6b28b8","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2012 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"福田, 隆"},{"creatorName":"市川, 治"},{"creatorName":"西村, 雅史"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takashi, Fukuda","creatorNameLang":"en"},{"creatorName":"Osamu, Ichikawa","creatorNameLang":"en"},{"creatorName":"Masafumi, Nishimura","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"近年,特徴空間上の識別学習 (fMMI) が注目され,多くの認識システムで効果を挙げている.通常,識別的特徴変換器には,MFCC+ 動的特徴やセグメント特徴量 +LDA などのスペクトル変動情報を含む特徴パラメータが入力され,それが正準化空間に写像される.特徴空間上の識別学習は近代音声認識において不可欠な要素であるが,低 SNR 環境ではまだ改善の余地がある.本報告では,識別的特徴変換の枠組みに,雑音環境で頑健な性質を示す長時間スペクトル変動情報を組み込むことを提案する.提案手法は低 SNR 環境下で MFCC と動的特徴からなる標準的な特徴ベクトルセットと比較して 6.3% の性能改善を達成した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Discriminative training of feature space using a maximum mutual information (fMMI) objective function has been shown to yield remarkable accuracy improvements. MFCC and dynamic features or LDA features are usually used for discriminative feature transform to map the features into canonicalized feature space. Discriminatively trained feature space transforms are essential for modern speech recognition but still need further improvement for low SNR conditions. In this paper, we show how noise-robust long-term temporal features can be combined with fMMI to build better discriminative models for noisy speech. The fMMI combined with long-term temporal features achieved 6.3% error reduction on average in low SNR environments when compared to the short-term temporal features alone.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2012-01-27","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"21","bibliographicVolumeNumber":"2012-MUS-94"}]},"relation_version_is_last":true,"weko_creator_id":"11"}}