{"id":231302,"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00231302","sets":["1164:5159:11151:11431"]},"path":["11431"],"owner":"44499","recid":"231302","title":["誤り検出とコンテキスト適応誤り訂正による音声認識における希少語認識精度改善"],"pubdate":{"attribute_name":"公開日","attribute_value":"2023-11-25"},"_buckets":{"deposit":"ab807d9f-5a87-48a4-a77e-dd269df23c70"},"_deposit":{"id":"231302","pid":{"type":"depid","value":"231302","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"誤り検出とコンテキスト適応誤り訂正による音声認識における希少語認識精度改善","author_link":["624217","624215","624214","624218","624216","624213"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"誤り検出とコンテキスト適応誤り訂正による音声認識における希少語認識精度改善"},{"subitem_title":"Enhancing Recognition of Rare Words in ASR through Error Detection and Context-Aware Error Correction","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"分野横断(1)","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2023-11-25","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"名古屋大学情報学研究科知能システム学専攻"},{"subitem_text_value":"名古屋大学情報基盤センター"},{"subitem_text_value":"名古屋大学情報基盤センター"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":" Graduate School of Informatics, Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"Information Technology Center, Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"Information Technology Center, Nagoya University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/231302/files/IPSJ-SLP23149010.pdf","label":"IPSJ-SLP23149010.pdf"},"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP23149010.pdf","filesize":[{"value":"1.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_login","version_id":"76810f89-2370-41d2-917e-47301d961fc0","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2023 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"何, 嘉俊"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"楊, 沢坤"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"戸田, 智基"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Jiajun, He","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Zekun, Yang","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tomoki, Toda","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8663","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"Automatic speech recognition (ASR) systems often suffer from errors, particularly when recognizing rare words. These errors can be detrimental to downstream tasks such as keyword spotting and language understanding. To alleviate this issue, we propose an ASR error correction method that improves rare word recognition based on error detection and context-aware error correction. Our proposed method limits decoding to only the positions where corrections are required to minimize unnecessary computations. A rare word list is also used to provide additional contextual information for the model to correct errors related to rare words. Experimental results demonstrate that our proposed method outperforms previous works by a large margin in word error rate (WER) on five public datasets while also maintaining a reasonable inference speed. Additionally, the proposed method shows reasonable robustness across different ASR systems.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Automatic speech recognition (ASR) systems often suffer from errors, particularly when recognizing rare words. These errors can be detrimental to downstream tasks such as keyword spotting and language understanding. To alleviate this issue, we propose an ASR error correction method that improves rare word recognition based on error detection and context-aware error correction. Our proposed method limits decoding to only the positions where corrections are required to minimize unnecessary computations. A rare word list is also used to provide additional contextual information for the model to correct errors related to rare words. Experimental results demonstrate that our proposed method outperforms previous works by a large margin in word error rate (WER) on five public datasets while also maintaining a reasonable inference speed. Additionally, the proposed method shows reasonable robustness across different ASR systems.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2023-11-25","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"10","bibliographicVolumeNumber":"2023-SLP-149"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"updated":"2025-01-19T10:49:03.808051+00:00","created":"2025-01-19T01:31:31.423692+00:00","links":{}}