{"id":160407,"updated":"2025-01-20T12:18:57.295620+00:00","links":{},"created":"2025-01-19T00:33:19.430032+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00160407","sets":["1164:5064:8574:8710"]},"path":["8710"],"owner":"11","recid":"160407","title":["動的圧縮型ガンマチャープフィルタバンクを用いた音声明瞭度予測法:強調音声を対象とした比較検討"],"pubdate":{"attribute_name":"公開日","attribute_value":"2016-05-14"},"_buckets":{"deposit":"f5987edd-e936-4993-95a5-de12257ae8f8"},"_deposit":{"id":"160407","pid":{"type":"depid","value":"160407","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"動的圧縮型ガンマチャープフィルタバンクを用いた音声明瞭度予測法:強調音声を対象とした比較検討","author_link":["310327","310336","310337","310332","310326","310335","310329","310331","310333","310328","310334","310330"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"動的圧縮型ガンマチャープフィルタバンクを用いた音声明瞭度予測法:強調音声を対象とした比較検討"},{"subitem_title":"Predicting speech intelligibility using the dynamic compressive gammachirp filterbank: comparison with the result for enhanced speech","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2016-05-14","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Wakayama University"},{"subitem_text_value":"Wakayama University"},{"subitem_text_value":"Wakayama University"},{"subitem_text_value":"NTT Communication Science Laboratories"},{"subitem_text_value":"NTT Communication Science Laboratories"},{"subitem_text_value":"NTT Communication Science Laboratories"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Wakayama University","subitem_text_language":"en"},{"subitem_text_value":"Wakayama University","subitem_text_language":"en"},{"subitem_text_value":"Wakayama University","subitem_text_language":"en"},{"subitem_text_value":"NTT Communication Science Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NTT Communication Science Laboratories","subitem_text_language":"en"},{"subitem_text_value":"NTT Communication Science Laboratories","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/160407/files/IPSJ-MUS16111020.pdf","label":"IPSJ-MUS16111020.pdf"},"date":[{"dateType":"Available","dateValue":"2018-05-14"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS16111020.pdf","filesize":[{"value":"486.6 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"c2170ba5-8cd1-4b26-8c3a-0b4d8d22122d","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2016 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"山本, 克彦"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"入野, 俊夫"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"松井, 淑恵"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"荒木, 章子"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"木下, 慶介"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中谷, 智広"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Katsuhiko, Yamamoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Toshio, Irino","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Toshie, Matsui","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Shoko, Araki","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Keisuke, Kinoshita","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tomohiro, Nakatani","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8752","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"聴覚モデルベースで音声明瞭度を予測する客観的評価指標は,音声強調処理技術を評価するためにも必要不可欠である.しかし,従来法 (sEPSM) では聴覚末梢系の音圧依存特性 (圧縮特性) が反映されていない上に,スペクトル減算法以外の非線形な音声強調処理手法では評価されていなかった.本研究では,動的圧縮型ガンマチャープフィルタバンクを用いた音声明瞭度の予測法 (dcGC-sEPSM) を提案した.非線形の音声強調処理手法であるスペクトル減算法とウィナーフィルタ型の雑音抑圧法を用いて聴取実験を行った.客観的評価として,提案法 (dcGC-sEPSM) および既存法 (GT-sEPSM, CSII, STOI) を用いて音声明瞭度の予測を行った.聴取実験から得られた音声明瞭度と比較した結果,提案法は既存法よりも聴取実験の傾向に近い音声明瞭度を予測することがわかった.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"An objective measure index of speech intelligibility based on auditory models is essential to evaluate speech enhancement techniques. The conventional method (sEPSM) was proposed to account for subjective results on a spectral subtraction, but has not been tested by recent state-of-the-art speech enhancement algorithms. We developed a new method using the dynamic compressive gammachirp auditory filterbank (dcGC-sEPSM) for speech intelligibility (SI) prediction of synthetic sounds processed by nonlinear speech enhancement algorithms. Subjective experiments were performed by using the spectral subtraction and a recent Wiener filter algorithm. We compared the subjective SI scores with the objective SI scores predicted by the proposed dcGC-sEPSM, the original sEPSM, the three-level coherence SII (CSII), and the short-time objective intelligibility (STOI). The results show that the dcGC-sEPSM performs better than the conventional models.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2016-05-14","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"20","bibliographicVolumeNumber":"2016-MUS-111"}]},"relation_version_is_last":true,"weko_creator_id":"11"}}