% Technical report record; the last three names in the author field are the
% romanized forms of the first three (same people, listed in both scripts).
% The abstract field holds the Japanese abstract followed by the English one.
% NOTE(review): techreport entries require an institution field and none is
% present here; the key's host (ipsj.ixsq.nii.ac.jp) suggests IPSJ -- confirm and add.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00023287,
 author = {入江, 英嗣 and 高田, 正法 and 坂井, 修一 and Irie, Hidetsugu and Takada, Masanori and Sakai, Shuichi},
 title = {メモリ依存予測を利用したフォワーディング局所化手法},
 number = {80(2004-ARC-159)},
 month = jul,
 year = {2004},
 abstract = {実行コアを複数の実行クラスタへ分割する“クラスタ型アーキテクチャ”は、広い実行幅と高クロック動作の両立を実現する方法として注目されている。クラスタ型アーキテクチャに関する様々な研究が行われている一方で、分散局所化の難しいメモリ参照処理がボトルネックとなることが指摘されている。各クラスタに小容量のD0キャッシュ(以下、D0)を設けるための手法はいくつか検討されているが、曖昧な依存関係や実行遅延予測のため、効果的な構成とすることが難しい。我々は既に、メモリ参照を分散局所化する手法として、メモリ依存予測を利用した“分散投機メモリフォワーディング”を提案している。本論文では、複数D0と分散投機メモリフォワーディングの比較評価を行い、それぞれの有効性を検討する。評価から、実行遅延予測失敗によりペナルティのため、プリミティブな複数D0が有効となるためには、大きなD0容量が必要な事が分かった。一方、分散投機メモリフォワーディングは適用率に限界があるものの、実行遅延予測失敗によるペナルティがないため、クラスタ内に小容量バッファしか利用できない場合に有効であることが分かった。, Clustered Microarchitecture design which partitions its execution core into multiple execution clusters attract attention as the way to achieve wide and fast processing. While there are various studies on Clustered Microarchitectures are done, it is often pointed out that the cache access overheads limit its performance. To overcome this bottleneck, we have proposed the technique "Distributed Speculative Memory Forwarding" which uses memory dependence prediction and localize memory processing.　In this paper, we estimate the proposed technique and the "Replicated Intra Cluster Cache", and compare their efficiency. Simulation results show that the scheduler replay caused by cache misses severely degrades performance of intra cluster cache. On the other hand, proposed technique shows good performance despite small buffer sizes.}
}