% Conference paper on the hybrid CPU/GPU OpenACC port of Nek5000 (EASC 2014
% revised selected papers, Springer LNCS series).
% NOTE(review): `address` is the publisher's city; "Cham" is inferred from the
% copyright holder "Springer International Publishing Switzerland" -- confirm.
% NOTE(review): the LNCS volume number is not recorded in this entry; add a
% `volume` field once verified against the publisher's page.
@inproceedings{da386a55631d4e0691ae6d50a56e7919,
  author    = {Gong, Jing and Markidis, Stefano and Schliephake, Michael and Laure, Erwin and Henningson, Dan and Schlatter, Philipp and Peplinski, Adam and Hart, Alistair and Doleschal, Jens and Henty, David and Fischer, Paul},
  title     = {{Nek5000} with {OpenACC}},
  booktitle = {Solving Software Challenges for Exascale: International Conference on Exascale Applications and Software, {EASC} 2014, Revised Selected Papers},
  editor    = {Markidis, Stefano and Laure, Erwin},
  series    = {Lecture Notes in Computer Science},
  pages     = {57--68},
  publisher = {Springer},
  address   = {Cham},
  year      = {2015},
  doi       = {10.1007/978-3-319-15976-8_4},
  language  = {English (US)},
  keywords  = {GPU programming, Nek5000, OpenACC, Spectral element method},
  abstract  = {Nek5000 is a computational fluid dynamics code based on the spectral element method used for the simulation of incompressible flows. We follow up on an earlier study which ported the simplified version of Nek5000 to a GPU-accelerated system by presenting the hybrid CPU/GPU implementation of the full Nek5000 code using OpenACC. The matrix-matrix multiplication, the Nek5000 gather-scatter operator and a preconditioned Conjugate Gradient solver have been implemented using OpenACC for multi-GPU systems. We report a speed-up of 1.3 on a single node of a Cray XK6 when using OpenACC directives in Nek5000. On 512 nodes of the Titan supercomputer, the speed-up approaches 1.4. A performance analysis of the Nek5000 code using Score-P and Vampir performance monitoring tools shows that overlapping of GPU kernels with host-accelerator memory transfers would considerably increase the performance of the OpenACC version of Nek5000 code.},
  note      = {Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2015; International Conference on Exascale Applications and Software, EASC 2014; Conference date: 2--3 April 2014},
}