{"updated":"2025-01-19T08:32:26.687398+00:00","links":{},"id":238524,"created":"2025-01-19T01:41:48.400958+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00238524","sets":["1164:2735:11468:11707"]},"path":["11707"],"owner":"44499","recid":"238524","title":["転移学習を用いた高齢話者の音声認識率向上手法"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-08-29"},"_buckets":{"deposit":"28c01188-453d-45b3-9f3e-3ae2d10d9fa5"},"_deposit":{"id":"238524","pid":{"type":"depid","value":"238524","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"転移学習を用いた高齢話者の音声認識率向上手法","author_link":["653168","653164","653165","653169","653166","653167"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"転移学習を用いた高齢話者の音声認識率向上手法"},{"subitem_title":"Method for Improving Speech Recognition Rates for Elderly Speakers Using Transfer Learning","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2024-08-29","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"奈良女子大学"},{"subitem_text_value":"奈良女子大学"},{"subitem_text_value":"奈良女子大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Nara Women's University","subitem_text_language":"en"},{"subitem_text_value":"Nara Women's University","subitem_text_language":"en"},{"subitem_text_value":"Nara Women's University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/238524/files/IPSJ-MPS24150004.pdf","label":"IPSJ-MPS24150004.pdf"},"date":[{"dateType":"Available","dateValue":"2026-08-29"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MPS24150004.pdf","filesize":[{"value":"678.0 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"17"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"50cc8c89-7d8a-423c-b2e7-8a2b4babcf8a","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"鎌田, 万由"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"千代延, 未帆"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"髙田, 雅美"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Mayu, Kamada","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Miho, Chiyonobu","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Masami, Takata","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10505667","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8833","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,高齢話者の発話を認識するための音声認識器の認識率改善を目的としている.音声認識器を開発する場合,明瞭な発音やノイズが少ない音声データを学習データとして用いることが一般的である.明瞭な発音やノイズの少ない音声データを使用した音声認識器を使用する場合,発音が不明瞭であったり,声に震えが生じやすい高齢話者の音声をテストデータとする場合,認識率が下がる.この認識率の低下を改善するために,転移学習を行い,学習データに加工した音声を用いる.本稿では,音声認識器である Whisper を用いて転移学習を行う.また,音声加工として高齢者の音声特性の 1 つである嗄声と,声の震えを再現するための加工を音声に施す.高齢者の嗄声を再現するために残差信号を変換するノイズ強調法を使用する.また,高齢者の声の震えを再現するためにトレモロを使用する.未加工の音声を学習データとして用いたものと加工した音声を学習データとして用いたものに対して高齢者の音声をテストデータとして与え,認識率の算出を行う.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"5","bibliographic_titles":[{"bibliographic_title":"研究報告数理モデル化と問題解決(MPS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-08-29","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4","bibliographicVolumeNumber":"2024-MPS-150"}]},"relation_version_is_last":true,"weko_creator_id":"44499"}}