{"id":218454,"updated":"2025-01-19T15:09:23.966560+00:00","links":{},"created":"2025-01-19T01:18:49.413786+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00218454","sets":["1164:5064:10822:10948"]},"path":["10948"],"owner":"44499","recid":"218454","title":["双曲空間への音色埋め込みを用いたガウス混合変分自己符号化器による楽音合成の検討"],"pubdate":{"attribute_name":"公開日","attribute_value":"2022-06-10"},"_buckets":{"deposit":"bbfd24e4-5862-4f09-9801-8494be5663b1"},"_deposit":{"id":"218454","pid":{"type":"depid","value":"218454","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"双曲空間への音色埋め込みを用いたガウス混合変分自己符号化器による楽音合成の検討","author_link":["568074","568071","568073","568075","568072"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"双曲空間への音色埋め込みを用いたガウス混合変分自己符号化器による楽音合成の検討"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"ポスターセッション4","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2022-06-10","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京大学"},{"subitem_text_value":"東京大学"},{"subitem_text_value":"東京大学"},{"subitem_text_value":"産業技術総合研究所"},{"subitem_text_value":"東京大学"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"the University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"the University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"the University of Tokyo","subitem_text_language":"en"},{"subitem_text_value":"National Institute of Advanced Industrial Science and Technology (AIST)","subitem_text_language":"en"},{"subitem_text_value":"the University of Tokyo","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/218454/files/IPSJ-MUS22134062.pdf","label":"IPSJ-MUS22134062.pdf"},"date":[{"dateType":"Available","dateValue":"2024-06-10"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MUS22134062.pdf","filesize":[{"value":"441.2 kB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"21"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"380610ef-4f41-4afa-bb2d-f8b3e7707735","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2022 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"中島, 風太"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中村, 友彦"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"高宗, 典玄"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"深山, 覚"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"猿渡, 洋"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10438388","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8752","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"本稿では,音色の階層性を考慮した変分自己符号化器(variational autoencoder: VAE)による楽音合成法を提案する.VAE に基づく楽音合成では,楽器音をその特徴を捉えた低次元な潜在空間に射影しそこから再構成できるよう学習する.潜在空間で効率的な表現を得るためには,データの性質を反映した潜在空間を構築することが重要である.これに対し,本稿では物理的な機構に基づく楽器分類体系には階層性が存在することに着眼し,音色に関する潜在変数を階層性のあるデータを効率的に表現できる双曲空間上で定義した VAE を提案する.提案法は,音色と音高を別々の潜在空間で扱うことのできる従来法を拡張し,音色に関する潜在変数の事前分布として双曲空間上の正規分布(擬似双曲正規分布)を導入する.また,擬似双曲正規分布の導入を行っても,従来法と同様に確率的勾配降下法を用いて学習できることを示す.実験により,音色に関する潜在空間において,Euclid 空間を用いる場合に比べ双曲空間を用いることで,同一楽器類はより近く,異種楽器類はより遠くへと埋め込まれることが示唆された.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"8","bibliographic_titles":[{"bibliographic_title":"研究報告音楽情報科学(MUS)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2022-06-10","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"62","bibliographicVolumeNumber":"2022-MUS-134"}]},"relation_version_is_last":true,"weko_creator_id":"44499"}}