{"updated":"2025-01-20T07:00:45.528744+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00174119","sets":["1164:2240:8543:8882"]},"path":["8882"],"owner":"11","recid":"174119","title":["学習条件を考慮した大規模非同期ディープラーニングシステムの性能モデリング"],"pubdate":{"attribute_name":"公開日","attribute_value":"2016-08-01"},"_buckets":{"deposit":"25e75085-6531-4c2b-b2dc-b8452b903580"},"_deposit":{"id":"174119","pid":{"type":"depid","value":"174119","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"学習条件を考慮した大規模非同期ディープラーニングシステムの性能モデリング","author_link":["356180","356183","356179","356182","356181","356178"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"学習条件を考慮した大規模非同期ディープラーニングシステムの性能モデリング"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"機械学習","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2016-08-01","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"東京工業大学"},{"subitem_text_value":"東京工業大学"},{"subitem_text_value":"デンソーアイティーラボラトリ"},{"subitem_text_value":"株式会社デンソー"},{"subitem_text_value":"株式会社デンソー"},{"subitem_text_value":"東京工業大学"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/174119/files/IPSJ-HPC16155005.pdf","label":"IPSJ-HPC16155005.pdf"},"date":[{"dateType":"Available","dateValue":"2018-08-01"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-HPC16155005.pdf","filesize":[{"value":"2.4 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"14"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"a0a23c23-5017-44b8-86d5-411d4893b341","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2016 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"大山, 洋介"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"野村, 哲弘"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"佐藤, 育郎"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"西村, 裕紀"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"玉津, 幸政"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"松岡, 聡"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10463942","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8841","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"機械学習による画像認識において Convolutional Neural Network (CNN) と大規模なデータセットを用いた高い認識結果が報告されている.CNN の学習にはミニバッチ Stochastic Gradient Descent (SGD) と呼ばれる最適化手法が広く用いられるが,不適切なミニバッチサイズ下では認識性能が悪化することが知られている.SGD を高速化するために GPU での CNN の計算とパラメータの更新を非同期に行う非同期 SGD が提案されているが,ミニバッチサイズが動的に定まることからノード数等の学習条件の最適値は明らかではない.本論文では非同期 SGD で CNN の学習を行うシステム SPRINT の性能モデルを提案する.この性能モデルは CNN の構造とマシン性能・構成を入力とし,データセット全体を学習に使用する時間と平均ミニバッチサイズを予測する.TSUBAME-KFC/DL の 1~16 ノードを用いた評価では複数の CNN 構造について学習時間と平均ミニバッチサイズの平均予測誤差は 8%以下だった.また,2 つの異なるマシン上である平均ミニバッチサイズの範囲内で学習時間が最短となる学習条件を探索したところ,モデルが予測した順位は実測での順位と一致した.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"9","bibliographic_titles":[{"bibliographic_title":"研究報告ハイパフォーマンスコンピューティング(HPC)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2016-08-01","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"5","bibliographicVolumeNumber":"2016-HPC-155"}]},"relation_version_is_last":true,"weko_creator_id":"11"},"created":"2025-01-19T00:44:21.181742+00:00","id":174119,"links":{}}