@comment{Conference paper from the 16th European PVM/MPI Users' Group Meeting (2009), published in a Springer Lecture Notes in Computer Science proceedings volume. The acronym in the title is brace-protected so sentence-casing styles keep its capitals.}
@inproceedings{e9d2ed11c6d743fab0be86971df6f0a1,
  author    = {Zhu, Hao and Goodell, David and Gropp, William and Thakur, Rajeev},
  title     = {Hierarchical collectives in {MPICH2}},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface - 16th European {PVM/MPI} Users' Group Meeting, Proceedings},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Germany},
  year      = {2009},
  pages     = {325--326},
  doi       = {10.1007/978-3-642-03770-2_41},
  isbn      = {3642037690},
  language  = {English (US)},
  keywords  = {Collective Communication, MPI},
  abstract  = {Most parallel systems on which MPI is used are now hierarchical, such as systems with SMP nodes. Many papers have shown algorithms that exploit shared memory to optimize collective operations to good effect. But how much of the performance benefit comes from tailoring the algorithm to the hierarchical topology of the system? We describe an implementation of many of the MPI collectives based entirely on message-passing primitives that exploits the two-level hierarchy. Our results show that exploiting shared memory directly usually gives small additional benefit and suggests design approaches for where the benefit is large.},
  note      = {16th European Parallel Virtual Machine and Message Passing Interface Users' Group Meeting, EuroPVM/MPI ; Conference date: 07-09-2009 Through 10-09-2009},
}