@comment{
  Conference paper (chapter in the "Advances in Parallel Computing" series).
  The citation key is kept unchanged so existing \cite commands still resolve.
  Names are stored in "Last, First" form; acronyms and camel-case terms in the
  title are brace-protected so sentence-casing styles do not lowercase them.
}
@inproceedings{4ca29bb298d14e94b51b5adb7c82ee99,
  author    = {Davis, Joshua and Gao, Tao and Chandrasekaran, Sunita and Jagode, Heike and Danalis, Anthony and Dongarra, Jack and Balaji, Pavan and Taufer, Michela},
  title     = {Characterization of power usage and performance in data-intensive applications using {MapReduce} over {MPI}},
  booktitle = {Parallel Computing},
  editor    = {Foster, Ian and Joubert, Gerhard R. and Kucera, Ludek and Nagel, Wolfgang E. and Peters, Frans},
  series    = {Advances in Parallel Computing},
  publisher = {IOS Press BV},
  year      = {2020},
  pages     = {287--298},
  doi       = {10.3233/APC200053},
  language  = {English},
  keywords  = {Combiner optimizations, Data management, {KNL}, {KNM}, {PAPI}},
  abstract  = {This paper presents a quantitative evaluation of the power usage over time in data-intensive applications that use MapReduce over MPI. We leverage the PAPI powercap tool to identify ideal conditions for execution of our mini-applications in terms of (1) dataset characteristics (e.g., unique words in datasets); (2) system characteristics (e.g., KNL and KNM); and (3) implementation of the MapReduce programming model (e.g., impact of various optimizations). Results illustrate the high power utilization and runtime costs of data management on HPC architectures.},
  note      = {Publisher Copyright: {\textcopyright} 2020 The authors and IOS Press.},
}