% Conference paper record for GOPipe (PACT 2020).
% Case-sensitive tokens in the title are brace-protected so sentence-casing styles keep them.
% The publisher agrees with the copyright holder named in the note field.
@inproceedings{d4f616f2b20d4f41be481139b39abd2f,
title = "{GOPipe}: A granularity-oblivious programming framework for pipelined stencil executions on {GPU}",
abstract = "Recent studies have shown promising performance benefits when multiple stages of a pipelined stencil application are mapped to different parts of a GPU to run concurrently. An important factor for the computing efficiency of such pipelines is the granularity of a task. In previous programming frameworks that support true pipelined computations on GPU, the choice has to be made by the programmers during the application development time. Due to many difficulties, programmers' decisions are often far from optimal, causing inferior performance and performance portability. This paper presents GOPipe, a granularity-oblivious programming framework for efficient pipelined stencil executions on GPU. With GOPipe, programmers no longer need to specify the appropriate task granularity. GOPipe automatically finds it, and dynamically schedules tasks of that granularity for efficiency while observing all inter-task and inter-stage data dependencies. In our experiments on six real-life applications and various scenarios, GOPipe outperforms the state-of-the-art system by 1.39{$\times$} on average with a much better programming productivity.",
keywords = "GPU, Optimizations, Programming Framework",
author = "Chanyoung Oh and Zhen Zheng and Xipeng Shen and Jidong Zhai and Youngmin Yi",
note = "Publisher Copyright: {\textcopyright} 2020 Association for Computing Machinery.; 2020 ACM International Conference on Parallel Architectures and Compilation Techniques, PACT 2020 ; Conference date: 03-10-2020 Through 07-10-2020",
year = "2020",
month = sep,
day = "30",
doi = "10.1145/3410463.3414656",
language = "English",
series = "Parallel Architectures and Compilation Techniques - Conference Proceedings, PACT",
publisher = "Association for Computing Machinery",
pages = "43--54",
booktitle = "PACT 2020 - Proceedings of the ACM International Conference on Parallel Architectures and Compilation Techniques",
address = "United States",
}