{"updated":"2025-01-19T12:52:48.296115+00:00","links":{},"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00225217","sets":["1164:2735:11166:11167"]},"path":["11167"],"owner":"44499","recid":"225217","title":["線型モデルから全結合型ニューラルネットワークに対する学習重みの知識転移"],"pubdate":{"attribute_name":"公開日","attribute_value":"2023-03-02"},"_buckets":{"deposit":"37369708-0ea3-4663-99d6-94e98308be8b"},"_deposit":{"id":"225217","pid":{"type":"depid","value":"225217","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"線型モデルから全結合型ニューラルネットワークに対する学習重みの知識転移","author_link":["595533","595532"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"線型モデルから全結合型ニューラルネットワークに対する学習重みの知識転移"},{"subitem_title":"Knowledge Transfer from Linear Model into Fully-connected Neural Network via the Trained weights","subitem_title_language":"en"}]},"item_type_id":"4","publish_date":"2023-03-02","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"産業技術総合研究所人工知能研究センター"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/225217/files/IPSJ-MPS23142032.pdf","label":"IPSJ-MPS23142032.pdf"},"date":[{"dateType":"Available","dateValue":"2025-03-02"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-MPS23142032.pdf","filesize":[{"value":"6.3 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"17"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"fbcdc018-d088-4e33-8315-f2eb38677ab5","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2023 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"鈴木, 藍雅"}],"nameIdentifiers":[{}]}]},"item_4_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Aiga, Suzuki","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10505667","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8833","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"深層学習に用いられるほとんどの深層ニューラルネットワークモデルは，入力されたベクトル信号の Affine 変換によって異なるベクトル信号の中間表現に変換する，全結合層をその伝播規則に持つ．近年では画像認識の分野において Vision Transformer や MLP Mixer などに代表されるような，畳み込みによらず全結合層のみを用いて特徴表現の獲得を行うパッチベースのモデルが台頭していることからも，深層学習の文脈における全結合層の重要度は再び高まりつつある．本研究ではニューラルネットワークにおける全結合層のはたらきと，入力に対する線形変換によって推論を行う種々の線型モデルの間の類似性を元に，学習の容易な線型モデルで得られた重みをニューラルネットワークに転用し，その汎化性能を向上させる枠組みの提案を行う．実験では Affine 変換によるベクトル特徴の縮約モデルと，線型分類モデルを用いてニューラルネットワークの初期重みを決定することでその汎化性能が向上することを示した．","subitem_description_type":"Other"}]},"item_4_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"In deep learning, feed-forward deep neural networks often have an affine layer that maps a vector to another intermediate representation via an affine transformation of the input vector. Recently, in computer vision, convolution-free image recognition models such as Vision Transformer and MLP Mixer have emerged that use only affine transformations to obtain the feature representations of images. Thus, the importance of such fundamental affine layers grown again. This work provides a learning framework that transfers knowledge learned in linear models to affine-based neural networks. The concept is based on the theoretical similarity between the mapping mechanism of linear models and affine layers. In experiments, we demonstrate that the weight initialization from linear dimensionality reduction and linear classification model improves generalization performance of deep neural networks.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"6","bibliographic_titles":[{"bibliographic_title":"研究報告数理モデル化と問題解決（MPS）"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2023-03-02","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"32","bibliographicVolumeNumber":"2023-MPS-142"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"id":225217,"created":"2025-01-19T01:24:43.748399+00:00"}