@comment{
  Workshop paper in the ISC High Performance 2018 International Workshops
  proceedings (Lecture Notes in Computer Science series).
  Cleaned up from an automated export:
    - names are in "Last, First" form; hyphenated given names restored
      (NOTE(review): confirm spelling against the published paper);
    - acronyms / proper names in the title are brace-protected so that
      sentence-casing styles keep their capitalisation;
    - the funding acknowledgement lives in the non-standard "funding" field
      and the event data in eventtitle / eventdate, so that nothing from the
      former note field is printed in the rendered reference.
  The citation key is unchanged.
}
@inproceedings{d8c924d2a9b0464bbddcc14542f5e6e0,
  author     = {Pearson, Carl and Chung, I-Hsin and Sura, Zehra and Hwu, Wen-Mei and Xiong, Jinjun},
  title      = {{NUMA}-Aware Data-Transfer Measurements for {Power/NVLink} Multi-{GPU} Systems},
  booktitle  = {High Performance Computing -- {ISC} High Performance 2018 International Workshops, Revised Selected Papers},
  editor     = {Weiland, Mich{\`e}le and Yokota, Rio and Alam, Sadaf and Shalf, John},
  series     = {Lecture Notes in Computer Science},
  publisher  = {Springer-Verlag Berlin Heidelberg},
  year       = {2018},
  pages      = {448--454},
  isbn       = {978-3-030-02464-2},
  doi        = {10.1007/978-3-030-02465-9_32},
  langid     = {american},
  eventtitle = {International Conference on High Performance Computing, ISC High Performance 2018},
  eventdate  = {2018-06-28},
  keywords   = {Benchmark, CUDA, GPGPU, NVLink, Unified Memory},
  abstract   = {High-performance computing increasingly relies on heterogeneous systems with specialized hardware accelerators to improve application performance. For example, NVIDIA{\textquoteright}s CUDA programming system and general-purpose GPUs have emerged as a widespread accelerator in HPC systems. This trend has exacerbated challenges of data placement as accelerators often have fast local memories to fuel their computational demands, but slower interconnects to feed those memories. Crucially, real-world data-transfer performance is strongly influenced not just by the underlying hardware, but by the capabilities of the programming systems. Understanding how application performance is affected by the logical communication exposed through abstractions, as well as the underlying system topology, is crucial for developing high-performance applications and architectures. This report presents initial data-transfer microbenchmark results from two POWER-based systems obtained during work towards developing an automated system performance characterization tool.},
  funding    = {This work is supported by IBM-ILLINOIS Center for Cognitive Computing Systems Research (C3SR) - a research collaboration as part of the IBM Cognitive Horizon Network. This work was supported by the Center for Applications Driving Architectures (ADA), one of six centers of JUMP, a Semiconductor Research Corporation program co-sponsored by DARPA. This research is part of the Blue Waters sustained-petascale computing project, which is supported by the National Science Foundation award OCI-0725070 and the state of Illinois. Blue Waters is a joint effort of the University of Illinois at Urbana-Champaign and its National Center for Supercomputing Applications.},
}