{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00073738","sets":["1164:3782:6270:6383"]},"path":["6383"],"owner":"10","recid":"73738","title":["電子書籍の論理構造に基づくポーズ情報の推定とSSML構造化"],"pubdate":{"attribute_name":"公開日","attribute_value":"2011-03-21"},"_buckets":{"deposit":"9230689d-2eb3-44f8-9f20-4a93903082da"},"_deposit":{"id":"73738","pid":{"type":"depid","value":"73738","revision_id":0},"owners":[10],"status":"published","created_by":10},"item_title":"電子書籍の論理構造に基づくポーズ情報の推定とSSML構造化","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"電子書籍の論理構造に基づくポーズ情報の推定とSSML構造化"},{"subitem_title":"Pause estimation based on e-book logical structures and SSML transformation","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"電子書籍","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2011-03-21","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東芝研究開発センター"},{"subitem_text_value":"東芝研究開発センター"},{"subitem_text_value":"東芝研究開発センター"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"TOSHIBA CORPORATION Corporate Research & Development Center","subitem_text_language":"en"},{"subitem_text_value":"TOSHIBA CORPORATION Corporate Research & Development Center","subitem_text_language":"en"},{"subitem_text_value":"TOSHIBA CORPORATION Corporate Research & Development Center","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/73738/files/IPSJ-DD11080006.pdf"},"date":[{"dateType":"Available","dateValue":"2013-03-21"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-DD11080006.pdf","filesize":[{"value":"398.3 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"32"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"2146df96-4995-489d-931b-e2a941002441","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2011 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"布目, 光生"},{"creatorName":"鈴木, 優"},{"creatorName":"森田, 眞弘"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Kosei, Fume","creatorNameLang":"en"},{"creatorName":"Masaru, Suzuki","creatorNameLang":"en"},{"creatorName":"Masahiro, Morita","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10539261","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"電子書籍を音声合成で読み上げる場合に,文書の書式特徴を活用してより聞きやすい朗読を実現するテキスト前処理手段を提案する.文を処理の基本単位とする従来の発話手法では困難な,タイトルや箇条書きと本文を区別したような読み方や,文書全体の構成や流れを考慮したような,自然な読み上げの実現を目指す.今回,具体的なアプローチとして,入力文書テキストの特徴量として論理構造をはじめとする抽出手段と,特にポーズ情報に関連したメタデータの推定手段,そして,音声合成エンジンへ提供するための XML 化,という一連のテキスト処理機能の試作と,ポーズ情報の付与精度評価を行った.本報告では,これらの手法と評価実験結果について述べる.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"We conduct feasibility studies for the development of a text preprocessing technique that uses document formatting features for improved natural speech synthesis with the aim of targeting e-book readers. In traditional text-to-speech (TTS) systems, it is difficult to implement a feature by which the different document elements such as the document body, title, and itemized forms are read in a suitable tone. We implement certain functionalities, namely a sentence characteristics extractor that determines the logical nature of a document element, a metadata estimator that generates pause information, and a transformer that converts these results to speech synthesis markup language, which a TTS system can process. Details about these processes and experimental results of a simple implementation of pause estimation are described in this report.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"7","bibliographic_titles":[{"bibliographic_title":"研究報告デジタルドキュメント(DD)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2011-03-21","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"6","bibliographicVolumeNumber":"2011-DD-80"}]},"relation_version_is_last":true,"weko_creator_id":"10"},"id":73738,"updated":"2025-01-21T21:49:55.389114+00:00","links":{},"created":"2025-01-18T23:31:33.783414+00:00"}