% Conference paper "Nek5000 with OpenACC" from the EASC 2014 revised selected
% papers (Springer LNCS). The citation key is the exporter's opaque identifier
% and is kept unchanged so existing citations keep resolving.
%
% Fields `funding`, `eventtitle`, `eventdate` and `langid` are ignored by
% classic BibTeX styles; biblatex uses the event and langid fields, and
% `funding` is retained purely as a non-printing record of the acknowledgement.
%
% NOTE(review): `address` was "Germany" in the export; it is set to Cham on the
% basis of the 978-3-319 ISBN prefix (Springer International Publishing) --
% confirm against the publisher record.
% NOTE(review): the LNCS volume number is not recorded here -- add a `volume`
% field once confirmed.
@inproceedings{da386a55631d4e0691ae6d50a56e7919,
  author     = {Gong, Jing and Markidis, Stefano and Schliephake, Michael and Laure, Erwin and Henningson, Dan and Schlatter, Philipp and Peplinski, Adam and Hart, Alistair and Doleschal, Jens and Henty, David and Fischer, Paul},
  title      = {{Nek5000} with {OpenACC}},
  booktitle  = {Solving Software Challenges for Exascale -- International Conference on Exascale Applications and Software, {EASC} 2014, Revised Selected Papers},
  editor     = {Markidis, Stefano and Laure, Erwin},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer},
  address    = {Cham},
  year       = {2015},
  pages      = {57--68},
  doi        = {10.1007/978-3-319-15976-8_4},
  isbn       = {978-3-319-15976-8},
  eventtitle = {International Conference on Exascale Applications and Software, {EASC} 2014},
  eventdate  = {2014-04-02/2014-04-03},
  language   = {english},
  langid     = {american},
  keywords   = {GPU programming, Nek5000, OpenACC, Spectral element method},
  abstract   = {Nek5000 is a computational fluid dynamics code based on the spectral element method used for the simulation of incompressible flows. We follow up on an earlier study which ported the simplified version of Nek5000 to a GPU-accelerated system by presenting the hybrid CPU/GPU implementation of the full Nek5000 code using OpenACC. The matrix-matrix multiplication, the Nek5000 gather-scatter operator and a preconditioned Conjugate Gradient solver have implemented using OpenACC for multi-GPU systems. We report an speed-up of 1.3 on single node of a Cray XK6 when using OpenACC directives in Nek5000. On 512 nodes of the Titan supercomputer, the speed-up can be approached to 1.4. A performance analysis of the Nek5000 code using Score-P and Vampir performance monitoring tools shows that overlapping of GPU kernels with host-accelerator memory transfers would considerably increase the performance of the OpenACC version of Nek5000 code.},
  funding    = {This research has received funding from the Swedish e-Science Research Centre (SeRC) and the European Community{\textquoteright}s Seventh Framework Programme (ICT-2011.9.13) under Grant Agreement no. 287703, cresta.eu. We are grateful for the computing time that was made available to us on the Raven system at Cray and on the Titan supercomputer at Oak Ridge National Laboratory within the INCITE program. We would also like to thank Dr. George K. El Khoury for the benchmark used in the paper.},
}