{"links":{},"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00217725","sets":["581:10784:10788"]},"path":["10788"],"owner":"44499","recid":"217725","title":["日本語逐次音声合成における合成単位"],"pubdate":{"attribute_name":"公開日","attribute_value":"2022-04-15"},"_buckets":{"deposit":"36fde966-b83a-4399-b17c-ec7ead33ecba"},"_deposit":{"id":"217725","pid":{"type":"depid","value":"217725","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"日本語逐次音声合成における合成単位","author_link":["564566","564561","564562","564563","564565","564564"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"日本語逐次音声合成における合成単位"},{"subitem_title":"Synthesis Unit for Japanese Incremental Text-to-Speech","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[一般論文] 同時音声通訳システム，逐次音声合成，アクセント句，日本語","subitem_subject_scheme":"Other"}]},"item_type_id":"2","publish_date":"2022-04-15","item_2_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"奈良先端科学技術大学院大学"},{"subitem_text_value":"北陸先端科学技術大学院大学／奈良先端科学技術大学院大学／理化学研究所観光情報解析チーム"},{"subitem_text_value":"奈良先端科学技術大学院大学／理化学研究所観光情報解析チーム"}]},"item_2_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"NAIST","subitem_text_language":"en"},{"subitem_text_value":"JAIST / NAIST / RIKEN AIP","subitem_text_language":"en"},{"subitem_text_value":"NAIST / RIKEN AIP","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/217725/files/IPSJ-JNL6304023.pdf","label":"IPSJ-JNL6304023.pdf"},"date":[{"dateType":"Available","dateValue":"2024-04-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-JNL6304023.pdf","filesize":[{"value":"1.0 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"8"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"4a3b7e1c-ebc0-4346-af58-3899b8c23087","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2022 by the Information Processing Society of Japan"}]},"item_2_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"柳田, 智也"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"サクテイ, サクリアニ"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中村, 哲"}],"nameIdentifiers":[{}]}]},"item_2_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Tomoya, Yanagita","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Sakriani, Sakti","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Satoshi, Nakamura","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_2_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN00116647","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_2_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7764","subitem_source_identifier_type":"ISSN"}]},"item_2_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"同時音声通訳システムは，話者の発話中に翻訳を行い音声を生成する．その実現のために，文より短いテキストから，音声を生成する逐次音声合成が必要である．本論文は，同時音声通訳システムの実現を目指して，日本語における逐次音声合成の提案を目的とする．先行研究は，逐次音声合成のために使用する言語特徴を制限し，合成範囲を単語としている．しかし，日本語音声合成は，アクセント句と呼ばれる単位が重要であり，単語の逐次音声合成が，音声品質と遅延のトレードオフとして適さない可能性がある．本論文では，日本語逐次音声合成のため，逐次音声合成の言語特徴を提案する．そして，言語特徴の組合せから，遅延と音声品質に最適な合成範囲を決定する．実験結果より，アクセント句から呼気段落の合成範囲が音声の品質を保持するために必要であることを示した．さらに，遅延評価を通して，アクセント句が日本語の逐次音声合成へ適することを示した．","subitem_description_type":"Other"}]},"item_2_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"A simultaneous speech translation system translates while the speaker speaks and generates speech sequentially. To construct the system, an incremental Text-to-speech (iTTS) system which synthesizes a speech in a shorter synthesis unit is required. This work proposes a Japanese iTTS system for the simultaneous speech translation. Most of the researchers used the word unit as the synthesis unit. However, in Japanese speech synthesis, a unit called an accent phrase is important, and word-by-word synthesis may not be suitable. In this paper, we propose a linguistic feature and synthesis unit for Japanese iTTS. Experimental result shows that accent phrase or breath group are essential for a Japanese iTTS system as a trade-off between quality and synthesis units for the Japanese iTTS. Then, an accent phrase is a more appropriate incremental synthesis unit than a breath group through delay analysis.","subitem_description_type":"Other"}]},"item_2_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"1158","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌"}],"bibliographicPageStart":"1149","bibliographicIssueDates":{"bibliographicIssueDate":"2022-04-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"4","bibliographicVolumeNumber":"63"}]},"relation_version_is_last":true,"item_2_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.20729/00217617","subitem_identifier_reg_type":"JaLC"}]},"weko_creator_id":"44499"},"updated":"2025-01-19T15:24:08.210118+00:00","created":"2025-01-19T01:18:12.287772+00:00","id":217725}