{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00218524","sets":["1164:5159:10869:10940"]},"path":["10940"],"owner":"44499","recid":"218524","title":["クラウドソーシングを用いた合成音声の音質主観評価のためのワーカ選抜基準"],"pubdate":{"attribute_name":"公開日","attribute_value":"2022-06-10"},"_buckets":{"deposit":"46dae0e5-98ee-4e65-9517-78714627da10"},"_deposit":{"id":"218524","pid":{"type":"depid","value":"218524","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"クラウドソーシングを用いた合成音声の音質主観評価のためのワーカ選抜基準","author_link":["568386","568387","568389","568385","568390","568391","568392","568388"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"クラウドソーシングを用いた合成音声の音質主観評価のためのワーカ選抜基準"},{"subitem_title":"Worker Filtering Criteria for Subjective Evaluation of Sound Quality of Synthesized Voice Using Crowdsourcing","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"ポスターセッション4","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2022-06-10","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"早稲田大学"},{"subitem_text_value":"早稲田大学／株式会社知能フレームワーク研究所"},{"subitem_text_value":"早稲田大学／株式会社知能フレームワーク研究所"},{"subitem_text_value":"早稲田大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Waseda University","subitem_text_language":"en"},{"subitem_text_value":"Waseda University / Intelligent Framework Lab Inc.","subitem_text_language":"en"},{"subitem_text_value":"Waseda University / Intelligent Framework Lab Inc.","subitem_text_language":"en"},{"subitem_text_value":"Waseda 
University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/218524/files/IPSJ-SLP22142065.pdf","label":"IPSJ-SLP22142065.pdf"},"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP22142065.pdf","filesize":[{"value":"2.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_login","version_id":"9d1c87bf-4474-4b10-bc48-24ffe573d3c2","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2022 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"八重樫, 萌絵"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"斎藤, 奨"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中野, 鐵兵"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"小川, 哲司"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Moe, Yaegashi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Susumu, Saito","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Teppei, Nakano","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tetsuji, 
Ogawa","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8663","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"クラウドソーシングを用いた合成音声の主観評価において，クラウドワーカの選抜基準が評価結果に与える影響を調査した．現在，合成音声の主観評価においてクラウドソーシングの利活用が進んでいる．その際，所望する条件を満たすワーカに対してのみ評価を依頼できることが望ましいが，合成音声の主観評価においてそのようなワーカ選抜基準は確立されていない．それに対し本研究では，音質（歪みの度合い）の評価に焦点を当て，合成音声主観評価のためのワーカ選抜基準について検討を行った．選抜試験では，音質の違いを聞き分ける能力を評価可能にするために，抑揚，音質以外の属性は同一となるように比較タスクを設計した．さらに，ワーカが音質の違いを直感的に理解できるように，選抜試験の冒頭で歪みの多い音声を複数回連続して提示した．Amazon Mechanical Turk 上で音質評価実験を行い，i) 歪みの量に着目して評価をしているか（意図理解度），ii) 回答に整合性はあるか（回答整合率），iii) 確信をもって回答しているか（回答確信度），といった選抜基準が主観評価結果に与える影響を調査した．その結果，意図理解や回答に対する確信の度合いの測定はワーカの選抜において有効であり，そのためには，意図理解に役立つサンプル（ここでは，音質が悪い音声）を数サンプル用意して比較タスクに含めれば良いことが明らかになった．","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"We investigate the effect of filtering criteria of crowdworkers on the subjective evaluation results of synthesized voice using crowdsourcing. Currently, crowdsourcing has been used for subjective evaluation of synthesized voice. Although it is desirable to remove workers who do not satisfy the client’s requirements, worker filtering criteria have not yet been defined. 
In this study, we focused on subjective evaluation of sound quality (amount of distortion) and examined filtering criteria. In the filtering test, the comparison task was designed so that attributes other than intonation and sound quality were identical in order to enable evaluation of the ability to distinguish differences in sound quality. In order for the worker to understand the difference in sound quality intuitively, we showed the workers the highly distorted voice several times repeatedly at the beginning of the evaluation. We conducted sound quality evaluation experiments on Amazon Mechanical Turk to investigate the effects of the following filtering criteria on the subjective evaluation results: i) whether the evaluation was focused on the amount of distortion (Understanding of Intent), ii) whether the responses were consistent (Response Consistency Rate), iii) whether the responses were given with confidence (Response Confidence). The results showed that measuring the degree of Understanding of Intentions and Response Confidence is effective in worker selection, and this can be achieved by including a few samples that are useful for Understanding of Intention (in this study, low sound quality voice) in the comparison task.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理（SLP）"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2022-06-10","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"65","bibliographicVolumeNumber":"2022-SLP-142"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":218524,"updated":"2025-01-19T15:08:02.001566+00:00","links":{},"created":"2025-01-19T01:18:53.513856+00:00"}