{"links":{},"id":169883,"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00169883","sets":["1164:5159:8497:8861"]},"path":["8861"],"owner":"11","recid":"169883","title":["講演のリアルタイム字幕付与のための音声認識結果の簡約"],"pubdate":{"attribute_name":"公開日","attribute_value":"2016-07-21"},"_buckets":{"deposit":"b9940a96-766e-4bdc-8d83-7fd65f30930a"},"_deposit":{"id":"169883","pid":{"type":"depid","value":"169883","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"講演のリアルタイム字幕付与のための音声認識結果の簡約","author_link":["341911","341908","341912","341909","341907","341910"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"講演のリアルタイム字幕付与のための音声認識結果の簡約"},{"subitem_title":"Condensation of Speech Recognition Results for Real-Time Lecture Captioning","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"言語モデル・簡約","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2016-07-21","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"京都大学情報学研究科"},{"subitem_text_value":"京都大学経済学研究科"},{"subitem_text_value":"京都大学情報学研究科"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Informatics, Kyoto University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Economics, Kyoto University","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Informatics, Kyoto University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/169883/files/IPSJ-SLP16112012.pdf","label":"IPSJ-SLP16112012.pdf"},"date":[{"dateType":"Available","dateValue":"2018-07-21"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP16112012.pdf","filesize":[{"value":"482.5 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"c7fc3f79-ecdb-4f96-9a06-bea6d1b2fc79","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2016 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"大田, 健翔"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"秋田, 祐哉"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"河原, 達也"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Kensho, Ota","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Yuya, Akita","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tatsuya, Kawahara","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8663","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本研究では,聴覚障がい者への情報保障のために,講演に対する音声認識を用いたリアルタイムの字幕付与を扱う.話し言葉を音声認識で書き起こす際には,冗長な語句も認識結果として出力されるため文字数が増えて読みにくくなる.そこで本研究では,文意を保存しつつ冗長な語句を削減する簡約処理を検討する.具体的には,講演内容を理解するにあたって必要な単語 (内容語) とそうでない単語 (付属語) に分類し,原則として後者を削除し前者のみを残して字幕として提示する.この原則にあてはまらないものがあるので,内容語で削除するものをアノテーション頻度の比率に基づいて決定し,付属語で復元するものをアノテーション頻度の比率,N-gram による言語尤度比較,機械学習を用いる方法で決定する.講演音声の書き起こしに対して簡約処理を行った結果,正解率 78%・圧縮率 64%で文を圧縮することができた.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"We have been investigating a real-time captioning framework using automatic speech recognition (ASR) technology for hearing-impaired audience. Since an ASR system transcribes all of speech input, including redundant spoken expressions, resulting captions are very long and thus hard to read and understand. To solve this problem, we propose a “condensation” method, which reduces unnecessary expressions in ASR results as much as possible while retaining key meaning of the utterances. Specifically, each word in ASR results is classified into a content word or a dependent word. Basically, the latter is deleted, while the former is retained for captions. However, there are exceptions in this principle, thus we further introduce refinement process. Redundant content words to be deleted are determined using occurrence counts in annotated training data. On the other hand, for recovery of dependent words, we investigate three methods: occurrence counts in annotated training data, linguistic likelihood measure calculated by an N-gram language model, and a machine learning framework. In an experiment over real lecture transcriptions, word-based compression rate of 64% and accuracy of 78% was obtained.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2016-07-21","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"12","bibliographicVolumeNumber":"2016-SLP-112"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-19T00:40:36.727037+00:00","updated":"2025-01-20T08:49:20.967932+00:00"}