% Conference paper describing NWPerf (2004 IEEE International Conference on Cluster Computing).
% The citation key is kept exactly as exported so existing citations keep resolving.
% Authors use the unambiguous "Last, First" form; case-sensitive words in the title are brace-protected.
@inproceedings{39dcc739ccfc4bf6aecf9f5ace0a2649,
  author    = {Mooney, Ryan and Schmidt, Kenneth P. and Studham, R. Scott and Nieplocha, Jarek},
  title     = {{NWPerf}: A system wide performance monitoring tool for large {Linux} clusters},
  booktitle = {2004 IEEE International Conference on Cluster Computing, ICCC 2004},
  series    = {Proceedings - IEEE International Conference on Cluster Computing, ICCC},
  pages     = {379--389},
  year      = {2004},
  doi       = {10.1109/CLUSTR.2004.1392637},
  isbn      = {0780386949},
  language  = {English (US)},
  note      = {Copyright: Copyright 2011 Elsevier B.V., All rights reserved.; 2004 IEEE International Conference on Cluster Computing, ICCC 2004 ; Conference date: 20-09-2004 Through 23-09-2004},
  abstract  = {We present NWPerf, a new system for analyzing fine granularity performance metric data on large-scale supercomputing clusters. This tool is able to measure application efficiency on a system wide basis from both a global system perspective as well as providing a detailed view of individual applications. NWPerf provides this service while minimizing the impact on the performance of user applications. We describe the type of information that can be derived from the system, and demonstrate how the system was used to detect and eliminate a performance problem in an application that improved performance by up to several thousand percent. The NWPerf architecture has proven to be a stable and scalable platform for gathering performance data on a large 1954-CPU production Linux cluster at PNNL.},
}