% Conference paper (publisher: IPSJ, May 2012) proposing MESI-CUDA, a framework
% that automates host/device data transfers for GPGPU programs.
% The abstract field carries the Japanese abstract followed by the English one.
% author-romanized is a non-standard field that styles ignore; it keeps the
% romanized author names in "Family, Given" order for reference.
@inproceedings{oai:ipsj.ixsq.nii.ac.jp:00082199,
  author           = {道浦, 悌 and 大野, 和彦 and 松本, 真樹 and 佐々木, 敬泰 and 近藤, 利夫},
  author-romanized = {Michiura, Dai and Ohno, Kazuhiko and Matsumoto, Masaki and Sasaki, Takahiro and Kondo, Toshio},
  title            = {{GPGPU}におけるデータ転送を自動化する{MESI-CUDA}の提案},
  booktitle        = {先進的計算基盤システムシンポジウム論文集},
  volume           = {2012},
  pages            = {201--209},
  publisher        = {情報処理学会},
  month            = may,
  year             = {2012},
  abstract         = {近年，GPU上で汎用計算を実行するGPGPUが注目されている．また，CUDAやOpenCLなどの開発環境がリリースされ，GPUプログラミングは容易になりつつある．しかし，これらの環境では，ホストメモリ・デバイスメモリ間のデータ転送をプログラマが明示的に記述する必要がある．そこで，我々はデータ転送を自動化するフレームワークMESI-CUDAを提案している．本論文では，MESI-CUDAのプログラミングモデルを示し，データ転送とカーネル処理のオーバラップ実現のためのデータフロー解析とストリーム割り当て手法を述べる．MESI-CUDAの性能を示すために，手動で最適化したCUDAプログラムとMESI-CUDAの出力プログラムで実行時間を比較して，評価を行った．その結果，実行時間にほとんど差が無く，ほぼ最適に近いコードを得ることができた．, The performance of Graphics Processing Units (GPU) is improving rapidly. Thus, General Purpose computation on Graphics Processing Units (GPGPU) is expected as an important method for high-performance computing. Although programming frameworks, such as CUDA and OpenCL, are provided, they require explicit specification of memory allocations and data transfers. Therefore, we are developing a new programming framework MESI-CUDA, which hides such low-level description from the user. In this paper, we present the programming model of MESI-CUDA and show the detail of data flow analysis and stream allocation to overlap data transfers and kernel executions. The evaluation result shows that the performance of MESI-CUDA programs is close to hand-optimized CUDA programs, nevertheless the data transfer code is automatically generated and optimized.},
}