% Conference paper from the 2020 IEEE High Performance Extreme Computing
% Conference (HPEC 2020). The proceedings title lives in `booktitle` only:
% the exporter's `series` value repeated it verbatim and is left out so that
% styles do not print the proceedings title twice. Acronyms are braced so
% sentence-casing styles keep their capitals.
@inproceedings{b2b6e686ca5e4c5ea87deb3e4149a145,
  author    = {Brewer, Wesley and Behm, Greg and Scheinine, Alan and Parsons, Ben and Emeneker, Wesley and Trevino, Robert P.},
  title     = {Inference Benchmarking on {HPC} Systems},
  booktitle = {2020 {IEEE} High Performance Extreme Computing Conference, {HPEC} 2020},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2020},
  month     = sep,
  day       = {22},
  doi       = {10.1109/HPEC43674.2020.9286138},
  language  = {English},
  keywords  = {GPU, MLPerf, ResNet50, benchmark, distributed, inference},
  abstract  = {As deep learning on edge computing systems has become more prevalent, investigation of architectures and configurations for optimal inference performance has become a critical step for proposed artificial intelligence solutions. While there has been considerable work in the development of hardware and software for high performance inferencing, there is little known about the performance of such systems on HPC architectures. In this paper, we address outstanding questions on the parallel inference performance on HPC systems. We report results and recommendations derived from evaluating iBench on multiple platforms in a variety of HPC configurations. We systematically benchmark single-GPU performance, single-node performance, and multi-node performance for maximum client-side and server-side inference throughput. In order to achieve linear speedup, we show that concurrent sending clients must be used, as opposed to sending large batch payloads parallelized across multiple GPUs. We show that client/server inferencing architectures add a considerable data transfer component that needs to be taken into consideration when benchmarking HPC system that benchmarks such as MLPerf do not measure. Finally, we investigate energy efficiency of GPUs for different levels of concurrency and batch sizes to report optimal configurations that minimize cost per inference.},
  note      = {Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 IEEE High Performance Extreme Computing Conference, HPEC 2020 ; Conference date: 21-09-2020 Through 25-09-2020},
}