% Conference paper (13th European PVM/MPI User's Group Meeting, 2006) published in
% Springer's Lecture Notes in Computer Science series. The citation key is kept as
% exported so existing \cite commands continue to resolve. "address" holds the
% publisher's city; the conference dates are recorded in "note".
@inproceedings{b9857537594c479fb0698df90cfae0e6,
  author    = {Byna, Surendra and Sun, {Xian He} and Thakur, Rajeev and Gropp, William},
  title     = {Automatic memory optimizations for improving {MPI} derived datatype performance},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing Interface - 13th European {PVM/MPI} User's Group Meeting, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  publisher = {Springer},
  address   = {Berlin, Heidelberg},
  pages     = {238--246},
  year      = {2006},
  isbn      = {3-540-39110-X},
  doi       = {10.1007/11846802_36},
  language  = {English (US)},
  keywords  = {Derived datatypes, MPI, MPI performance optimization},
  abstract  = {MPI derived datatypes allow users to describe noncontiguous memory layout and communicate noncontiguous data with a single communication function. This powerful feature enables an MPI implementation to optimize the transfer of noncontiguous data. In practice, however, many implementations of MPI derived datatypes perform poorly, which makes application developers avoid using this feature. In this paper, we present a technique to automatically select templates that are optimized for memory performance based on the access pattern of derived datatypes. We implement this mechanism in the MPICH2 source code. The performance of our implementation is compared to well-written manual packing/unpacking routines and original MPICH2 implementation. We show that performance for various derived datatypes is significantly improved and comparable to that of optimized manual routines.},
  note      = {13th European PVM/MPI User's Group Meeting ; Conference date: 17-09-2006 Through 20-09-2006},
}