{"created":"2025-01-19T01:16:50.818966+00:00","updated":"2025-01-19T15:54:58.536493+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00216123","sets":["1164:5064:10822:10823"]},"path":["10823"],"owner":"44499","recid":"216123","title":["声質の可視化を用いた所望音声検索システムの提案"],"pubdate":{"attribute_name":"公開日","attribute_value":"2022-01-18"},"_buckets":{"deposit":"09461997-82a7-46da-89b9-4cd7ef5233c7"},"_deposit":{"id":"216123","pid":{"type":"depid","value":"216123","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"声質の可視化を用いた所望音声検索システムの提案","author_link":["557550","557555","557551","557553","557554","557552","557549"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"声質の可視化を用いた所望音声検索システムの提案"}]},"item_type_id":"4","publish_date":"2022-01-18","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"名古屋大学情報学研究科"},{"subitem_text_value":"名古屋大学情報基盤センター"},{"subitem_text_value":"名古屋大学未来社会創造機構/株式会社ティアフォー"},{"subitem_text_value":"名古屋大学情報基盤センター"},{"subitem_text_value":"名古屋大学情報学研究科"},{"subitem_text_value":"名城大学都市情報学部"},{"subitem_text_value":"名古屋大学未来社会創造機構/株式会社ティアフォー"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/216123/files/IPSJ-MUS22133006.pdf","label":"IPSJ-MUS22133006.pdf"},"date":[{"dateType":"Available","dateValue":"2024-01-18"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS22133006.pdf","filesize":[{"value":"823.4 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"7a3e69c4-b7c8-4014-8314-04d33610632d","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2022 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"佐治, 拓樹"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"小林, 和弘"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"石黒, 祥生"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"戸田, 智基"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"大谷, 健登"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"西野, 隆典"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"武田, 一哉"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8752","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"声質変換や歌声合成は,元となる音源データを入れ替えることにより,合成後の声質を容易に変更することができる.しかし,公開されている音声データセットは膨大なため,所望の声質のデータを探索することは非常に困難である.本研究では,声質の可視化を行い,その視覚情報を利用した声質検索システムの提案を行う.声質の可視化には,話者コードによって話者の特徴量を表現するサブネットワークを接続した VQVAE による声質変換モデルを使用する.サブネットワークで表現された各話者の特徴量を主成分分析によって二次元に削減することで,散布図の形で声質の可視化を行う.出力図の点をクリックすると対応した話者のサンプル音声を聞くことができるので,ユーザは可視化した図と実際に聞いた音声の関係を把握しながら所望の声質を探索していく.また,ユーザがシステムに探索したい声を声真似した音声を入力することで,出力図の改善を試みた.その結果,声真似を利用することで,データセットを可視化しただけの手法よりも探索の効率化を行えることがわかった.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"5","bibliographic_titles":[{"bibliographic_title":"研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2022-01-18","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"6","bibliographicVolumeNumber":"2022-MUS-133"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":216123,"links":{}}