@comment{Journal article. The same reference is repeated after this entry as an RIS record and as pre-formatted citation strings; that text lies outside any entry.}
@article{ART002459855,
  author  = {Kim, Gwang Bok and Kim, Jong Myon and Kim, Cheol Hong},
  title   = {Latency Hiding based Warp Scheduling Policy for High Performance {GPUs}},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2019},
  volume  = {24},
  number  = {4},
  pages   = {1--9},
  doi     = {10.9708/jksci.2019.24.04.001},
}
TY  - JOUR
AU  - Gwang Bok Kim
AU  - Jong Myon Kim
AU  - Cheol Hong Kim
TI  - Latency Hiding based Warp Scheduling Policy for High Performance GPUs
JO  - Journal of The Korea Society of Computer and Information
PY  - 2019
VL  - 24
IS  - 4
PB  - The Korean Society Of Computer And Information
SP  - 1
EP  - 9
SN  - 1598-849X
AB  - LRR(Loose Round Robin) warp scheduling policy for GPU architecture results in high warp-level parallelism and balanced loads across multiple warps. However, traditional LRR policy makes multiple warps execute long latency operations at the same time. In cases that no more warps to be issued under long latency, the throughput of GPUs may be degraded significantly. In this paper, we propose a new warp scheduling policy which utilizes latency hiding, leading to more utilized memory resources in high performance GPUs. The proposed warp scheduler prioritizes memory instruction based on GTO(Greedy Then Oldest) policy in order to provide reduced memory stalls. When no warps can execute memory instruction any more, the warp scheduler selects a warp for computation instruction by round robin manner. Furthermore, our proposed technique achieves high performance by using additional information about recently committed warps. According to our experimental results, our proposed technique improves GPU performance by 12.7% and 5.6% over LRR and GTO on average, respectively.
KW  - GPUs;Warp Scheduler;Latency Hiding;Thread Level Parallelism;Data Locality
DO  - 10.9708/jksci.2019.24.04.001
ER  - 
Gwang Bok Kim, Jong Myon Kim and Cheol Hong Kim. (2019). Latency Hiding based Warp Scheduling Policy for High Performance GPUs. Journal of The Korea Society of Computer and Information, 24(4), 1-9.
Gwang Bok Kim, Jong Myon Kim and Cheol Hong Kim. 2019, "Latency Hiding based Warp Scheduling Policy for High Performance GPUs", Journal of The Korea Society of Computer and Information, vol.24, no.4, pp.1-9. Available from: doi:10.9708/jksci.2019.24.04.001
Gwang Bok Kim, Jong Myon Kim, Cheol Hong Kim "Latency Hiding based Warp Scheduling Policy for High Performance GPUs" Journal of The Korea Society of Computer and Information 24.4 pp.1-9 (2019) : 1.
Gwang Bok Kim, Jong Myon Kim, Cheol Hong Kim. Latency Hiding based Warp Scheduling Policy for High Performance GPUs. Journal of The Korea Society of Computer and Information. 2019; 24(4), 1-9. Available from: doi:10.9708/jksci.2019.24.04.001
Gwang Bok Kim, Jong Myon Kim and Cheol Hong Kim. "Latency Hiding based Warp Scheduling Policy for High Performance GPUs" Journal of The Korea Society of Computer and Information 24, no.4 (2019) : 1-9. doi: 10.9708/jksci.2019.24.04.001
Gwang Bok Kim; Jong Myon Kim; Cheol Hong Kim. Latency Hiding based Warp Scheduling Policy for High Performance GPUs. Journal of The Korea Society of Computer and Information, 2019, 24(4), 1-9. doi: 10.9708/jksci.2019.24.04.001
Gwang Bok Kim; Jong Myon Kim; Cheol Hong Kim. Latency Hiding based Warp Scheduling Policy for High Performance GPUs. Journal of The Korea Society of Computer and Information. 2019; 24(4), 1-9. doi: 10.9708/jksci.2019.24.04.001
Gwang Bok Kim, Jong Myon Kim, Cheol Hong Kim. Latency Hiding based Warp Scheduling Policy for High Performance GPUs. Journal of The Korea Society of Computer and Information. 2019; 24(4), 1-9. Available from: doi:10.9708/jksci.2019.24.04.001
Gwang Bok Kim, Jong Myon Kim and Cheol Hong Kim. "Latency Hiding based Warp Scheduling Policy for High Performance GPUs" Journal of The Korea Society of Computer and Information 24, no.4 (2019) : 1-9. doi: 10.9708/jksci.2019.24.04.001