% Conference paper (LCN 2002, per the note field). Acronyms in the title are
% brace-protected so that sentence-casing styles keep their capitalisation.
% Author names are stored in "Last, First" form with plain initials.
@inproceedings{6fc06978dd8244a5851a17fb313269fc,
  author    = {Brightwell, R. and Lawry, W. and Maccabe, A. B. and Wilson, C.},
  title     = {Improving processor availability in the {MPI} implementation for the {ASCI/Red} supercomputer},
  booktitle = {Proceedings - LCN 2002},
  series    = {Proceedings - Conference on Local Computer Networks, LCN},
  pages     = {639--647},
  year      = {2002},
  publisher = {IEEE Computer Society},
  doi       = {10.1109/LCN.2002.1181841},
  language  = {English (US)},
  keywords  = {Availability, Bandwidth, Computer networks, Computer science, Contracts, Degradation, Laboratories, Performance gain, Portable computers, Supercomputers},
  abstract  = {This paper describes how a portable benchmark suite that measures the ability of an MPI implementation to overlap computation and communication can be used to discover and diagnose performance problems. We describe the approach of the benchmark suite and discuss a performance problem that we uncovered with the MPI implementation on the ASCI/Red supercomputer. A slight modification to the MPI implementation has resulted in a significant gain in CPU availability and bandwidth with a slight degradation in latency performance. We present a detailed analysis of these results and discuss how the benchmark suite has enabled us to tailor the MPI implementation to optimize for all three measurements.},
  note      = {Publisher Copyright: {\textcopyright} 2002 IEEE.; 27th Annual IEEE Conference on Local Computer Networks, LCN 2002 ; Conference date: 06-11-2002 Through 08-11-2002},
}