{"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00232512","sets":["1164:5159:11541:11549"]},"path":["11549"],"owner":"44499","recid":"232512","title":["IVAとDNNを近接平均化した優決定BSSに用いるDNNのアーキテクチャの比較"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-02-22"},"_buckets":{"deposit":"451dc2f1-c84c-42ec-a3d4-88167c022ca9"},"_deposit":{"id":"232512","pid":{"type":"depid","value":"232512","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"IVAとDNNを近接平均化した優決定BSSに用いるDNNのアーキテクチャの比較","author_link":["629485","629488","629487","629484","629483","629486"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"IVAとDNNを近接平均化した優決定BSSに用いるDNNのアーキテクチャの比較"},{"subitem_title":"Comparison of DNN architectures for determined BSS by proximal average of IVA and DNN","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"ポスターセッション1 SIP/EA","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2024-02-22","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"早稲田大学基幹理工学部;東京農工大学工学部"},{"subitem_text_value":"東京農工大学工学部"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"School of Fundamental Science and Engineering, Waseda University","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Engineering, Tokyo University of Agriculture and Technology","subitem_text_language":"en"},{"subitem_text_value":"Faculty of Engineering, Tokyo University of Agriculture and Technology","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing 
file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/232512/files/IPSJ-SLP24151042.pdf","label":"IPSJ-SLP24151042.pdf"},"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-SLP24151042.pdf","filesize":[{"value":"1.1 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"0","billingrole":"22"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_login","version_id":"08e573ef-985e-4721-b29c-9298b2dbd8ad","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Institute of Electronics, Information and Communication Engineers This SIG report is only available to those in membership of the SIG."}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"松本, 和樹"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"山田, 宏樹"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"矢田部, 浩平"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Kazuki, Matsumoto","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Koki, Yamada","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Kohei, Yatabe","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10442647","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical 
report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8663","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"我々はこれまで,Plug-and-Play と近接平均(PA)の枠組みに基づき,深層ニューラルネットワーク(DNN)による雑音除去器を用いて高性能な分離行列推定を実現するフレームワーク(PA-BSS)を提案した.PA-BSS は,独立ベクトル分析(IVA)と DNN の近接平均を主双対近接分離(PDS)アルゴリズムに Plug-and-Play することで,IVA の安定した分離能力と DNN の緻密な音源モデリング能力を両立した音源分離を実現する.しかし,どのような DNNを用いれば高い分離性能が得られ,アルゴリズムが良好な収束性を示すのかに関しては十分な検討がなされていない.そこで本稿では,2 種類の推定器と 3 種類の推定対象を用いた計 6 種類の DNN を用いて PA-BSS による音源分離を試み,各 DNN の性質とそれらを用いた PA-BSS の性能を評価した.推定器に関しては(1) Encoder-Decoder 型の Fully Convolutional Network,(2)U-Net の 2 種類を用いた.また,それらの推定対象に関しては,(1)目的音の振幅,(2)雑音成分の振幅,(3)目的音抽出マスクの 3 種類を比較した.結果として,U-Net により雑音成分を推定するアーキテクチャが分離性能,頑健性,アルゴリズムの収束性の観点で優れることが分かった.","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"We have proposed a framework called PA-BSS for high-performance separation matrix estimation using deep denoisers based on the framework of plug-and-play and proximal average (PA). By plug-and-play of proximal average of IVA and DNN into the primal-dual splitting (PDS) algorithm, PA-BSS achieves source separation that combines the stable separation capability of IVA with the detailed source modeling capability of DNNs. However, what kind of DNNs can achieve high separation performance and preferable algorithm convergence has not been thoroughly investigated. In this paper, we explore the properties of six different DNNs which are the combinations of two estimators and three estimation targets. The two estimators are (1) encoder-decoder type fully convolutional networks and (2) U-Net. As for the estimation targets, we use (1) the amplitude of the target source, (2) the amplitude of noise components, and (3) the time-frequency mask which extracts the target source. 
Then, we evaluate the separation performance of PA-BSS with those DNNs. As a result, we found that the architecture that estimates noise components using U-Net is superior in terms of separation performance, robustness, and algorithm convergence. ","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告音声言語情報処理(SLP)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-02-22","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"42","bibliographicVolumeNumber":"2024-SLP-151"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":232512,"updated":"2025-01-19T10:25:23.004527+00:00","links":{},"created":"2025-01-19T01:33:25.420712+00:00"}