% Workshop paper published in the LCPC 2014 revised selected papers (Springer, LNCS series).
% The citation key looks machine-generated; it is kept unchanged so existing citations still resolve.
% Names use the "Last, First" form, and acronyms in title/booktitle are brace-protected against style recasing.
@inproceedings{8a9de336f14640cfb18e9832d21e928b,
  author    = {Ghike, Swapnil and Gran, Rub{\'e}n and Garzar{\'a}n, Mar{\'i}a J. and Padua, David A.},
  title     = {Directive-Based Compilers for {GPUs}},
  booktitle = {Languages and Compilers for Parallel Computing -- 27th International Workshop, {LCPC} 2014, Revised Selected Papers},
  editor    = {Brodman, James and Tu, Peng},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Cham},
  year      = {2015},
  pages     = {19--35},
  doi       = {10.1007/978-3-319-17473-0_2},
  language  = {English (US)},
  keywords  = {Accelerator, Cray, Directive-based compiler, Evaluation, GPGPU, OpenACC, PGI},
  abstract  = {General Purpose Graphics Computing Units can be effectively used for enhancing the performance of many contemporary scientific applications. However, programming GPUs using machine-specific notations like CUDA or OpenCL can be complex and time consuming. In addition, the resulting programs are typically fine-tuned for a particular target device. A promising alternative is to program in a conventional and machine-independent notation extended with directives and use compilers to generate GPU code automatically. These compilers enable portability and increase programmer productivity and, if effective, would not impose much penalty on performance. This paper evaluates two such compilers, PGI and Cray. We first identify a collection of standard transformations that these compilers can apply. Then, we propose a sequence of manual transformations that programmers can apply to enable the generation of efficient GPU kernels. Lastly, using the Rodinia Benchmark suite, we compare the performance of the code generated by the PGI and Cray compilers with that of code written in CUDA. Our evaluation shows that the code produced by the PGI and Cray compilers can perform well. For 6 of the 15 benchmarks that we evaluated, the compiler generated code achieved over 85\% of the performance of a hand-tuned CUDA version.},
  note      = {27th International Workshop on Languages and Compilers for Parallel Computing, LCPC 2014; conference date: 15--17 September 2014. Publisher copyright: {\textcopyright} Springer International Publishing Switzerland 2015},
}