% Conference paper (HPCC-2012 / ICESS-2012 joint proceedings), cleaned up from an automated export.
% - keywords: the exported value was garbled and duplicated; reconstructed here as
%   "PGAS, UPC, performance tools" -- TODO confirm against the publisher record.
% - series: the export repeated the booktitle verbatim in this field; it was dropped
%   because the proceedings title is not a publication series.
% - Acronyms are brace-protected so sentence-casing styles do not lowercase them.
@inproceedings{695d9fcdef9b4966ab9a2cc3f3137a3c,
  author    = {Guojing Cong and Huifang Wen and Hiroki Murata and Yasushi Negishi},
  title     = {Tool-assisted optimization of shared-memory accesses in {UPC} applications},
  booktitle = {Proceedings of the 14th {IEEE} International Conference on High Performance Computing and Communications, {HPCC-2012} - 9th {IEEE} International Conference on Embedded Software and Systems, {ICESS-2012}},
  pages     = {104--111},
  year      = {2012},
  doi       = {10.1109/HPCC.2012.24},
  isbn      = {9780769547497},
  language  = {English},
  keywords  = {PGAS, UPC, performance tools},
  abstract  = {UPC is designed to improve user productivity when programming distributed-memory machines. Yet the shared-memory abstraction also makes performance analysis hard as it introduces extra overhead with local accesses and implicit communication with remote ones. As far as we know, there are no mature software utilities for systematic analysis and tuning of shared-memory access performance in UPC programs. We develop a mechanism to track shared memory accesses and correlate them to the UPC source lines, functions, and data structures. We then apply tool-assisted analysis to a set of UPC programs. For the NAS UPC benchmark we achieve dramatic performance improvement over the unoptimized implementation as well as up to two times speedups over the fully hand-tuned implementation. We expect our approach effective in tuning a wide range of UPC programs.},
  note      = {14th IEEE International Conference on High Performance Computing and Communications, HPCC-2012 - 9th IEEE International Conference on Embedded Software and Systems, ICESS-2012 ; Conference date: 25-06-2012 Through 27-06-2012},
}