{"links":{},"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00232474","sets":["1164:5159:11541:11549"]},"path":["11549"],"owner":"44499","recid":"232474","title":["年齢情報とのマルチタスク学習による高齢者音声認識の高精度化"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-02-22"},"_buckets":{"deposit":"86e4c63b-234b-4213-9488-190625d75aba"},"_deposit":{"id":"232474","pid":{"type":"depid","value":"232474","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"年齢情報とのマルチタスク学習による高齢者音声認識の高精度化","author_link":["629277","629275","629276","629278","629281","629279","629282","629280"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"年齢情報とのマルチタスク学習による高齢者音声認識の高精度化"},{"subitem_title":"Multi-task learning with age information model for highly accurate elderly speech recognition.","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"SP1","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2024-02-22","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"豊橋技術科学大学"},{"subitem_text_value":"豊橋技術科学大学"},{"subitem_text_value":"豊橋技術科学大学"},{"subitem_text_value":"豊橋技術科学大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Toyohashi University of Technology","subitem_text_language":"en"},{"subitem_text_value":"Toyohashi University of Technology","subitem_text_language":"en"},{"subitem_text_value":"Toyohashi University of Technology","subitem_text_language":"en"},{"subitem_text_value":"Toyohashi University of Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing 
file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/232474/files/IPSJ-SLP24151004.pdf","label":"IPSJ-SLP24151004.pdf"},"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP24151004.pdf","filesize":[{"value":"1.4 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_login","version_id":"3cd67713-b06b-4600-82dd-21ae47b6196b","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"新惠, 拓実"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"木内, 貴浩"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"若林, 佑幸"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"北岡, 教英"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Takumi, Shine","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Takahiro, Kinouchi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yukoh, Wakabayashi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Norihide, Kitaoka","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, 
etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8663","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"高齢者の音声は,一般にスマートスピーカーなどに使用されている音声認識機では一般話者に比べて精度が低くなってしまう.これは高齢者音声には発声器官の衰えや間延びの増加,発話速度の低下などがあり,音響的特徴量に差があることが原因とされている.また,高齢者音声データは収録が容易ではなく,データ量が少ないといった事も高齢者音声の認識精度を向上できない理由の一つとして挙げられる.本研究では,年齢推定タスクを同時に行うマルチタスクモデルを用いることで,認識精度の向上を試みた.一つ目に,純粋に年齢推定を行いながら音声認識を行うことで年齢情報を考慮した音声認識が可能になるモデルを構築した.二つ目に,年齢推定タスクと音声認識タスクで敵対的マルチタスク学習を行うことで,一般成人と高齢者に共通する年齢不変な音響特徴量を抽出し,学習を進めることで認識精度の向上を狙うモデルを構築した.また,三つ目に年齢推定器を改良したマルチタスク学習モデルを構築した.これらのモデルの精度を比較し,考察を行った.結果として高齢者の音声だけでなく一般成人に対する認識精度も改善でき,マルチタスク学習の有用性を示した.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"The speech recognition of the elderly is less accurate, especially in smart speaker speech recognition, due to aging-related factors such as vocal organ deterioration, increased pauses, and decreased speech rate, leading to differences in acoustic features. Challenges include difficulty in recording elderly speech and limited data availability. The aim of this study is to enhance the accuracy of elderly speech recognition. As a proposed method, we built two models: one integrating age estimation into the speech recognition model and another employing adversarial multitask learning with GAN framework. 
Comparing the accuracy of these models revealed improved recognition for both elderly and general adult speech, demonstrating the effectiveness of the multitasking approach.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-02-22","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4","bibliographicVolumeNumber":"2024-SLP-151"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"created":"2025-01-19T01:33:21.774645+00:00","updated":"2025-01-19T10:26:10.171943+00:00","id":232474}