{"updated":"2025-01-21T19:13:55.764041+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00081894","sets":["1164:5159:6679:6767"]},"path":["6767"],"owner":"11","recid":"81894","title":["リアルタイムクラウドソーシングとTwitter大規模コーパスを利用した対話システム"],"pubdate":{"attribute_name":"公開日","attribute_value":"2012-05-03"},"_buckets":{"deposit":"bcaf6fe8-2bd0-4a4c-8cd4-24d1c1fcc11c"},"_deposit":{"id":"81894","pid":{"type":"depid","value":"81894","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"リアルタイムクラウドソーシングとTwitter大規模コーパスを利用した対話システム","author_link":["0","0"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"リアルタイムクラウドソーシングとTwitter大規模コーパスを利用した対話システム"},{"subitem_title":"Dialog System Using Real-Time Crowdsourcing and Two-Length Tweet Corpus","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2012-05-03","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京大学"},{"subitem_text_value":"東京大学"},{"subitem_text_value":"東京大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"University of Tokyo","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/81894/files/IPSJ-SLP12091013.pdf"},"date":[{"dateType":"Available","dateValue":"2014-05-03"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP12091013.pdf","filesize":[{"value":"1.2 
MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"124c6a6f-1c49-48ae-9d54-b9bfb3938c03","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2012 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"別所, 史浩"},{"creatorName":"原田, 達也"},{"creatorName":"國吉, 康夫"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Fumihiro, Bessho","creatorNameLang":"en"},{"creatorName":"Tatsuya, Harada","creatorNameLang":"en"},{"creatorName":"Yasuo, Kuniyoshi","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"Twitter 大規模コーパスとリアルタイムクラウドソーシングの枠組みを利用した対話システムを提案する.我々のシステムは複雑な対話管理を行わず,ユーザ発話に対して最も近い発話をデータベース中から探し出し,それに対する応答をシステム応答として返す枠組みとなっている.またデータベース内に適切な応答が見つからなかったときには,その発言を即時に他ユーザにクラウドソースする.その際ユーザが匿名化され,かつクラウドソースをしていることを認知させないような仕組みを提案する.本論文ではまず,Twitter から日本語発話対を抽出し,内容を解析する.得られたデータの中で長さが 2 を超えるものは発話対全体の 58.3% であった.得られた発話対からの類似発話検索では,各種応答選択手法に対して AUC (Area Under 
the ROC Curve) を用いた性能の比較評価を行い,品詞フィルタリング,文書正規化,本研究における学習データの分類性能の向上に有効に働くことが示された.実装されたシステムの評価実験を通じて,システムの用いるデータ数の増加は,多くの場合システム性能の向上に寄与するが,一定の値において有意に性能が下落することが観測された.また,クラウドソースを含めた実験を通じて,クラウドソースの枠組みの導入でユーザがシステムとの対話の中に面白さを感じるようになることが示された.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"We propose a dialog system that creates responses based on a 2-length tweets database and real-time crowdsourcing. Our system replies with the utterance from the database that is most similar to the user input. We also propose a real-time crowdsourcing framework for handling the case in which there is no adequate response in the database. The response scoring function is designed and evaluated using a survey, based on which positive/negative utterance pairs are created. We examine the effect of data size and real-time crowdsourcing on system response. Our results show that system performance improves with an increasing amount of data in many cases, but not always, and that the crowdsourcing framework enhances the amusingness of the system.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"8","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2012-05-03","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"13","bibliographicVolumeNumber":"2012-SLP-91"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-18T23:35:55.594420+00:00","id":81894,"links":{}}