{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00069905","sets":["1164:5159:6009:6133"]},"path":["6133"],"owner":"10","recid":"69905","title":["雑音下マルチモーダル音声認識評価基盤CENSREC-1-AVの構築"],"pubdate":{"attribute_name":"公開日","attribute_value":"2010-07-15"},"_buckets":{"deposit":"810f082b-b2b0-4b44-9b57-788f43751d7b"},"_deposit":{"id":"69905","pid":{"type":"depid","value":"69905","revision_id":0},"owners":[10],"status":"published","created_by":10},"item_title":"雑音下マルチモーダル音声認識評価基盤CENSREC-1-AVの構築","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"雑音下マルチモーダル音声認識評価基盤CENSREC-1-AVの構築"},{"subitem_title":"CENSREC-1-AV An evaluation framework for multimodal speech recognition","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"頑健な音声認識","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2010-07-15","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"岐阜大学"},{"subitem_text_value":"名古屋大学"},{"subitem_text_value":"名古屋大学"},{"subitem_text_value":"名古屋大学"},{"subitem_text_value":"筑波大学"},{"subitem_text_value":"神戸大学"},{"subitem_text_value":"大同大学"},{"subitem_text_value":"豊橋技術科学大学"},{"subitem_text_value":"立命館大学"},{"subitem_text_value":"近畿大学"},{"subitem_text_value":"村田機械"},{"subitem_text_value":"NTTコミュニケーション科学基礎研究所"},{"subitem_text_value":"情報通信研究機構"},{"subitem_text_value":"早稲田大学"},{"subitem_text_value":"千葉大学"},{"subitem_text_value":"情報通信研究機構"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Gifu University","subitem_text_language":"en"},{"subitem_text_value":"Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"Nagoya University","subitem_text_language":"en"},{"subitem_text_value":"University of Tsukuba","subitem_text_language":"en"},{"subitem_text_value":"Kobe University","subitem_text_language":"en"},{"subitem_text_value":"Daido University","subitem_text_language":"en"},{"subitem_text_value":"Toyohashi University of Technology","subitem_text_language":"en"},{"subitem_text_value":"Ritsumeikan University","subitem_text_language":"en"},{"subitem_text_value":"Kinki University","subitem_text_language":"en"},{"subitem_text_value":"Murata Machinery","subitem_text_language":"en"},{"subitem_text_value":"NTT Communication Science Laboratories","subitem_text_language":"en"},{"subitem_text_value":"National Institute of Information and Communications Technology","subitem_text_language":"en"},{"subitem_text_value":"Waseda University","subitem_text_language":"en"},{"subitem_text_value":"Chiba University","subitem_text_language":"en"},{"subitem_text_value":"National Institute of Information and Communications Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/69905/files/IPSJ-SLP10082007.pdf"},"date":[{"dateType":"Available","dateValue":"2012-07-15"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP10082007.pdf","filesize":[{"value":"695.8 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"6695bc02-833a-41c4-85e7-cc4cfd21d07b","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2010 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"田村, 哲嗣"},{"creatorName":"宮島, 千代美"},{"creatorName":"北岡, 教英"},{"creatorName":"武田, 一哉"},{"creatorName":"山田, 武志"},{"creatorName":"滝口, 哲也"},{"creatorName":"柘植, 覚"},{"creatorName":"山本, 一公"},{"creatorName":"西浦, 敬信"},{"creatorName":"中山, 雅人"},{"creatorName":"傳田, 遊亀"},{"creatorName":"藤本, 雅清"},{"creatorName":"松田, 繁樹"},{"creatorName":"小川, 哲司"},{"creatorName":"黒岩, 眞吾"},{"creatorName":"中村, 哲"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Satoshi, Tamura","creatorNameLang":"en"},{"creatorName":"Chiyomi, Miyajima","creatorNameLang":"en"},{"creatorName":"Norihide, Kitaoka","creatorNameLang":"en"},{"creatorName":"Kazuya, Takeda","creatorNameLang":"en"},{"creatorName":"Takeshi, Yamada","creatorNameLang":"en"},{"creatorName":"Tetsuya, Takiguchi","creatorNameLang":"en"},{"creatorName":"Satoru, Tsuge","creatorNameLang":"en"},{"creatorName":"Kazumasa, Yamamoto","creatorNameLang":"en"},{"creatorName":"Takanobu, Nishiura","creatorNameLang":"en"},{"creatorName":"Masato, Nakayama","creatorNameLang":"en"},{"creatorName":"Yuki, Denda","creatorNameLang":"en"},{"creatorName":"Masakiyo, Fujimoto","creatorNameLang":"en"},{"creatorName":"Shigeki, Matsuda","creatorNameLang":"en"},{"creatorName":"Tetsuji, Ogawa","creatorNameLang":"en"},{"creatorName":"Shingo, Kuroiwa","creatorNameLang":"en"},{"creatorName":"Satoshi, Nakamura","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,音声と画像を用いたマルチモーダル音声認識の共通評価基盤 CENSREC-1-AV について紹介する.CENSREC-1-AV では,音声・画像データベースおよびベースラインシステムを提供する.音声は学習用クリーンデータのほか,乗用車走行雑音を付与したものを収録した.画像はカラー映像と近赤外線映像を収録し,ガンマ補正を用いて乗用車走行シミュレーション画像をテストデータとした.ベースラインシステムでは,MFCC と,固有顔ないしはオプティカルフローを特徴量として,マルチストリーム HMM により認識を行った.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"This paper introduces an evaluation framework for multimodal speech recognition: CENSREC-1-AV. The corpus CENSREC-1-AV provides an audiovisual speech database and a baseline system of multimodal speech recognition. Speech signals were recorded in clean condition for training and in-car noises were overlapped for testing. Color and infrared pictures were captured as training data, and image corruption was conducted for testing using the gamma correction technique. In the baseline system, acoustic MFCC as well as eigenface or optical-flow information are adopted as audio and visual features respectively, then multi-stream HMMs are used as a recognition model.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2010-07-15","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"7","bibliographicVolumeNumber":"2010-SLP-82"}]},"relation_version_is_last":true,"weko_creator_id":"10"},"id":69905,"updated":"2025-01-21T23:42:50.480632+00:00","links":{},"created":"2025-01-18T23:29:15.173272+00:00"}