{"updated":"2025-01-20T13:07:40.076365+00:00","links":{},"id":158051,"created":"2025-01-19T00:31:50.325668+00:00","metadata":{"_oai":{"id":"oai:ipsj.ixsq.nii.ac.jp:00158051","sets":["934:1119:8503:8504"]},"path":["8504"],"owner":"11","recid":"158051","title":["演算加速機構を持つクラスタ向けPGAS言語XcalableACCの評価"],"pubdate":{"attribute_name":"公開日","attribute_value":"2016-03-08"},"_buckets":{"deposit":"82814101-dee8-4940-af7c-26d5da5b4dad"},"_deposit":{"id":"158051","pid":{"type":"depid","value":"158051","revision_id":0},"owners":[11],"status":"published","created_by":11},"item_title":"演算加速機構を持つクラスタ向けPGAS言語XcalableACCの評価","author_link":["300869","300873","300875","300874","300876","300872","300868","300867","300870","300871"],"item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"演算加速機構を持つクラスタ向けPGAS言語XcalableACCの評価"},{"subitem_title":"Evaluation of A PGAS Language XcalableACC for Accelerator Clusters","subitem_title_language":"en"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"[コンパイラ] 演算加速機構,GPU,クラスタ,PGAS言語","subitem_subject_scheme":"Other"}]},"item_type_id":"3","publish_date":"2016-03-08","item_3_text_3":{"attribute_name":"著者所属","attribute_value_mlt":[{"subitem_text_value":"筑波大学大学院システム情報工学研究科"},{"subitem_text_value":"国立研究開発法人理化学研究所計算科学研究機構"},{"subitem_text_value":"国立研究開発法人理化学研究所計算科学研究機構"},{"subitem_text_value":"筑波大学大学院システム情報工学研究科/筑波大学計算科学研究センター"},{"subitem_text_value":"筑波大学大学院システム情報工学研究科/国立研究開発法人理化学研究所計算科学研究機構"}]},"item_3_text_4":{"attribute_name":"著者所属(英)","attribute_value_mlt":[{"subitem_text_value":"Graduate School of Systems and Information Engineering, University of Tsukuba","subitem_text_language":"en"},{"subitem_text_value":"RIKEN Advanced Institute for Computational Science","subitem_text_language":"en"},{"subitem_text_value":"RIKEN Advanced Institute for Computational Science","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Systems and Information Engineering, University of Tsukuba / Center for Computational Sciences, University of Tsukuba","subitem_text_language":"en"},{"subitem_text_value":"Graduate School of Systems and Information Engineering, University of Tsukuba / RIKEN Advanced Institute for Computational Science","subitem_text_language":"en"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_publisher":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"情報処理学会","subitem_publisher_language":"ja"}]},"publish_status":"0","weko_shared_id":-1,"item_file_price":{"attribute_name":"Billing file","attribute_type":"file","attribute_value_mlt":[{"url":{"url":"https://ipsj.ixsq.nii.ac.jp/record/158051/files/IPSJ-TACS0901004.pdf","label":"IPSJ-TACS0901004.pdf"},"date":[{"dateType":"Available","dateValue":"2018-03-08"}],"format":"application/pdf","billing":["billing_file"],"filename":"IPSJ-TACS0901004.pdf","filesize":[{"value":"2.9 MB"}],"mimetype":"application/pdf","priceinfo":[{"tax":["include_tax"],"price":"660","billingrole":"5"},{"tax":["include_tax"],"price":"330","billingrole":"6"},{"tax":["include_tax"],"price":"0","billingrole":"16"},{"tax":["include_tax"],"price":"0","billingrole":"11"},{"tax":["include_tax"],"price":"0","billingrole":"14"},{"tax":["include_tax"],"price":"0","billingrole":"15"},{"tax":["include_tax"],"price":"0","billingrole":"44"}],"accessrole":"open_date","version_id":"555c922b-b8a2-45ff-9f76-09503552b3fb","displaytype":"detail","licensetype":"license_note","license_note":"Copyright (c) 2016 by the Information Processing Society of Japan"}]},"item_3_creator_5":{"attribute_name":"著者名","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"田渕, 晶大"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"中尾, 昌広"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"村井, 均"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"朴, 泰祐"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"佐藤, 三久"}],"nameIdentifiers":[{}]}]},"item_3_creator_6":{"attribute_name":"著者名(英)","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Akihiro, Tabuchi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Masahiro, Nakao","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Hitoshi, Murai","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Taisuke, Boku","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Mitsuhisa, Sato","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AA11833852","subitem_source_identifier_type":"NCID"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourceuri":"http://purl.org/coar/resource_type/c_6501","resourcetype":"journal article"}]},"item_3_source_id_11":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1882-7829","subitem_source_identifier_type":"ISSN"}]},"item_3_description_7":{"attribute_name":"論文抄録","attribute_value_mlt":[{"subitem_description":"GPUやMICのような演算加速機構を持つクラスタが広く使われている.演算加速機構のプログラミングにOpenACCやOpenMP 4.0を用いてMPIと組み合わせることで,比較的簡易に演算加速機構を持つクラスタ向けのプログラムを記述できるようになったが,それでもなおMPIの記述が煩雑であるため生産性が低いという問題がある.そこで我々はPartitioned Global Address Space(PGAS)言語XcalableMPと演算加速機構プログラミングモデルOpenACCを統合したXcalableACC(XACC)を提案している.XACCでは逐次コードに指示文を追加することにより,演算加速機構を持つクラスタ向けのプログラミングが可能である.本稿では,XACCの通信指示文の一部をNVIDIA GPU向けに実装しベンチマークで性能評価を行った.MPI+OpenACCと比較してHimeno Benchmarkでは最大で97%,NAS Parallel Benchmarks(NPB)CGでは最大で96%の性能を達成した.また指示文による簡潔な記述によりMPI+OpenACCと比較してコード行数をHimeno Benchmarkでは51%,NPB CGでは79%に抑えられたことから,XACCは高い性能と生産性があるといえる.","subitem_description_type":"Other"}]},"item_3_description_8":{"attribute_name":"論文抄録(英)","attribute_value_mlt":[{"subitem_description":"Clusters equipped with accelerators such as GPU and MIC are widely used. For these clusters, programmers can develop their applications relatively easily by combining MPI with OpenACC or OpenMP 4.0, but lower productivity due to complex MPI programming is still a problem. We have been proposing XcalableACC (XACC), which is an integration of a Partitioned Global Address Space (PGAS) language XcalableMP (XMP) and OpenACC. XACC enables programmers to develop applications for accelerator clusters just by adding directives to a serial version of the code. In this paper, we show the implementation of the XACC communication directives for NVIDIA GPU and evaluated their performance using two benchmarks. The performance of the XACC version against MPI+OpenACC version is up to 97% for Himeno Benchmark and up to 96% for NAS Parallel Benchmarks (NPB) CG. The code size of XACC version against MPI+OpenACC version is 51% for Himeno Benchmark and 79% for NPB CG. Therefore, XACC features fully high performance and productivity.","subitem_description_type":"Other"}]},"item_3_biblio_info_10":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicPageEnd":"29","bibliographic_titles":[{"bibliographic_title":"情報処理学会論文誌コンピューティングシステム(ACS)"}],"bibliographicPageStart":"17","bibliographicIssueDates":{"bibliographicIssueDate":"2016-03-08","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicVolumeNumber":"9"}]},"relation_version_is_last":true,"weko_creator_id":"11"}}