{"links":{},"metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00241677","sets":["1164:1579:11464:11813"]},"path":["11813"],"owner":"44499","recid":"241677","title":["Intel AMXを用いた行列積和演算の性能評価"],"pubdate":{"attribute_name":"公開日","attribute_value":"2024-12-09"},"_buckets":{"deposit":"4f1295fa-bf73-426c-bbe2-ed427b93278d"},"_deposit":{"id":"241677","pid":{"type":"depid","value":"241677","revision_id":0},"owners":[44499],"status":"published","created_by":44499},"item_title":"Intel AMXを用いた行列積和演算の性能評価","author_link":["665780","665778","665779"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Intel AMXを用いた行列積和演算の性能評価"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"性能評価","subitem_subject_scheme":"Other"}]},"item_type_id":"4","publish_date":"2024-12-09","item_4_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"九州大学電気情報工学科"},{"subitem_text_value":"九州大学情報基盤研究開発センター"},{"subitem_text_value":"九州大学情報基盤研究開発センター"}]},"item_4_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Department of Electrical Engineering and Computer Science, School of Engineering, Kyushu University","subitem_text_language":"en"},{"subitem_text_value":"Research Institute for Information Technology, Kyushu University","subitem_text_language":"en"},{"subitem_text_value":"Research Institute for Information Technology, Kyushu University","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/241677/files/IPSJ-ARC24259012.pdf","label":"IPSJ-ARC24259012.pdf"},"date":[{"dateType":"Available","dateValue":"2026-12-09"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-ARC24259012.pdf","filesize":[{"value":"1.3 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"16"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"d1a03fa6-749f-47ce-bb49-e3029ddc7281","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2024 by the Information Processing Society of Japan"}]},"item_4_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"遠藤, 悠介"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"大島, 聡史"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"南里, 豪志"}],"nameIdentifiers":[{}]}]},"item_4_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10096105","subitem_source_identifier_type":"NCID"}]},"item_4_textarea_12":{"attribute_name":"Notice","attribute_value_mlt":[{"subitem_textarea_value":"SIG Technical Reports are nonrefereed and hence may later appear in any journals, conferences, symposia, etc."}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_18gh","resourcetype":"technical report"}]},"item_4_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2188-8574","subitem_source_identifier_type":"ISSN"}]},"item_4_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"近年,機械学習や深層学習が盛んになっている中,膨大な計算量を効率よく処理するために,bf16 といった低精度の演算が注目されている.Intel MKL や OpenBLAS といった数値線形代数ライブラリにも低精度の行列積ライブラリが実装されている.さらに計算を効率よく行うために,近年のハードウェアには CPU とは別に行列積計算ユニットが搭載され,これらの性能を最大限に引き出す研究が進められている.Intel Advanced Matrix Extension (AMX) もその 1 つであり,低精度の行列演算に特化したハードウェアアクセラレータである.本研究では,AMX を用いた行列積和演算について,ブロッキングとタイルの操作を最適化して実装し,既存のライブラリと比較して性能評価を行った.その結果,既存のライブラリの最大約 33.5% の計算時間の短縮を達成した.","subitem_description_type":"Other"}]},"item_4_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"15","bibliographic_titles":[{"bibliographic_title":"研究報告システム・アーキテクチャ(ARC)"}],"bibliographicPageStart":"1","bibliographicIssueDates":{"bibliographicIssueDate":"2024-12-09","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"12","bibliographicVolumeNumber":"2024-ARC-259"}]},"relation_version_is_last":true,"weko_creator_id":"44499"},"updated":"2025-01-19T07:34:57.404649+00:00","created":"2025-01-19T01:46:25.354568+00:00","id":241677}