{"links":{},"id":2009793,"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:02009793","sets":["1164:5064:1770876432362:1779319553198"]},"path":["1779319553198"],"owner":"80578","recid":"2009793","title":["ドメイン特化型の知覚的報酬を用いた強化学習によるアニメスタイル音声合成の最適化"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2026-05-29"},"_buckets":{"deposit":"6d223125-81c7-49bd-b5bc-140693b18c20"},"_deposit":{"id":"2009793","pid":{"type":"depid","value":"2009793","revision_id":0},"owners":[80578],"status":"published","created_by":80578},"item_title":"ドメイン特化型の知覚的報酬を用いた強化学習によるアニメスタイル音声合成の最適化","author_link":[],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"ドメイン特化型の知覚的報酬を用いた強化学習によるアニメスタイル音声合成の最適化","subitem_title_language":"ja"},{"subitem_title":"Optimizing Anime-Style Speech Synthesis via Reinforcement Learning with a Domain-Specific Perceptual Reward","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"SP","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2026-05-29","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"Spellbrush"},{"subitem_text_value":"Spellbrush"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Spellbrush","subitem_text_language":"en"},{"subitem_text_value":"Spellbrush","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/2009793/files/IPSJ-MUS26146020.pdf","label":"IPSJ-MUS26146020.pdf"},"date":[{"dateType":"Available","dateValue":"9999-01-01"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS26146020.pdf","filesize":[{"value":"1.4 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"d9760293-37e3-4264-8448-c9fbdf8d8c09","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2026 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"朴,浚鎔"}]},{"creatorNames":[{"creatorName":"Jerry,Li"}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8752","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"音声言語モデルによる音声合成は近年急速に進展しているが,アニメ声等の特定ドメインに特化されたスタイル制御は依然として課題である.既存の強化学習に基づく手法では,書き起こし誤り(CER)等の検証可能な報酬のみに依存することでプロソディが平板化したり,言語ドリフトが生じるといった問題が報告されている.また,UTMOSのような汎用的な平均オピニオンスコア(MOS)予測器は知覚的自然さを捕捉できる一方で,アニメ声らしさといったスタイル次元を直接的には捉えない.本稿では,アニメ声らしさを学習した知覚的分類器を強化学習における報酬として導入し,CERを硬い制約として併用する報酬設計を提案する.日本語ベースモデルでの学習に加え,同一手法を異なる規模および言語のモデルに転用した場合の挙動を観察し,得られた音声出力に対する自動スコアおよび人手聴取試験の双方を用いて分布シフトを検証する.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2026-05-29","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"20","bibliographicVolumeNumber":"2026-MUS-146"}]},"relation_version_is_last":true,"weko_creator_id":"80578"},"created":"2026-05-21T06:17:17.776393+00:00","updated":"2026-05-21T06:17:23.859629+00:00"}