% Technical report (2002) on algorithm selection for parallel sparse
% matrix-vector multiplication; Japanese title, bilingual abstract.
% The four authors are listed once in `author`; their romanized names are
% kept in the non-standard (style-ignored) `author-en` field in
% "Family, Given" order, matching the Japanese forms.
% NOTE(review): techreport entries require an `institution` field, which is
% missing here; the citation key suggests the IPSJ repository -- confirm and add.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00029319,
 author    = {工藤, 誠 and 黒田, 久泰 and 片桐, 孝洋 and 金田, 康正},
 author-en = {Kudoh, Makoto and Kuroda, Hisayasu and Katagiri, Takahiro and Kanada, Yasumasa},
 title     = {並列疎行列ベクトル積における最適なアルゴリズム選択の効果},
 number    = {22(2001-HPC-089)},
 month     = mar,
 year      = {2002},
 abstract  = {並列疎行列ベクトル積の性能は行列の構造や計算機の性質に大きく依存するため，これらの性質に合わせた高速化手法で計算することが重要である．本論文では筆者らの作成した複数の高速化手法を含んだ並列疎行列ベクトル積のルーチンを紹介する．また行列や計算機の性質に応じて最適な高速化手法を選択した場合の性能を，従来法である妥当な固定手法を用いた場合の性能と比較する．4機種の並列計算機上での実験では，最適なアルゴリズム選択により平均して1.29倍の速度向上が得られた．, The computational performance of parallel sparse matrix-vector multiplication (SpMxV) depends highly on the non-zero structure of the target matrix and the nature of machine's architecture. Therefore it is important to select the best optimization method according to these characteristics. In this paper, our parallel SpMxV routine which includes several optimization algorithms is described, and the performance with optimal algorithm is compared to that with uniform default algorithm on 4 kinds of parallel machines. The average speed-up of 1.29 is obtained.},
}