@inproceedings{d1f0a79384b74fa6a3632c8b9dabd074,
title = "Decoupled load balancing",
abstract = "Modern scientific simulations divide work between parallel processors by decomposing a spatial domain of mesh cells, particles, or other elements. A balanced assignment of the computational load is critical for parallel performance. If the computation per element changes over the simulation time, simulations can use dynamic load balance algorithms to evenly redistribute work to processes. Graph partitioners are widely used and balance very effectively, but they do not strong scale well. Typical SPMD simulations wait while a load balance algorithm runs on all processors, so a poorly scaling algorithm can itself become a bottleneck. We observe that the load balance algorithm is separate from the main application computation and has its own scaling properties. We propose to decouple the load balance algorithm from the application, and to offload the load balance computation so that it runs concurrently with the application on a smaller number of processors. We demonstrate the costs of decoupling and offloading the load balancing algorithm from a Barnes-Hut application.",
keywords = "Load balance, Parallel algorithm, Performance",
author = "Olga Pearce and Todd Gamblin and {De Supinski}, {Bronis R.} and Martin Schulz and Amato, {Nancy M.}",
year = "2015",
month = jan,
day = "24",
doi = "10.1145/2688500.2688539",
language = "English (US)",
series = "Proceedings of the ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, PPOPP",
publisher = "Association for Computing Machinery",
pages = "267--268",
booktitle = "20th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, PPoPP 2015 - Proceedings",
address = "United States",
note = "20th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, PPoPP 2015 ; Conference date: 07-02-2015 Through 11-02-2015",
}