% Conference paper on the ARMCI runtime library for the Cray XT5 (Computing Frontiers 2010).
% The citation key is the exporter's opaque identifier; it is kept unchanged so existing \cite commands still resolve.
% NOTE(review): the accent on the second author's surname is kept exactly as exported ({\'a}); verify it against the published paper.
@inproceedings{d5bdc2881db74c0a90e301bf5c288973,
  author    = {Tipparaju, Vinod and Apr{\'a}, Edoardo and Yu, Weikuan and Vetter, Jeffrey S.},
  title     = {Enabling a highly-scalable global address space model for petascale computing},
  booktitle = {{CF} 2010 -- Proceedings of the 2010 Computing Frontiers Conference},
  year      = {2010},
  pages     = {207--216},
  doi       = {10.1145/1787275.1787326},
  isbn      = {9781450300445},
  language  = {English},
  keywords  = {armci, flow control, ga, gas, global address space, global arrays, nwchem, pgas, xt5},
  abstract  = {Over the past decade, the trajectory to the petascale has been built on increased complexity and scale of the underlying parallel architectures. Meanwhile, software developers have struggled to provide tools that maintain the productivity of computational science teams using these new systems. In this regard, Global Address Space (GAS) programming models provide a straightforward and easy to use addressing model, which can lead to improved productivity. However, the scalability of GAS depends directly on the design and implementation of the runtime system on the target petascale distributed-memory architecture. In this paper, we describe the design, implementation, and optimization of the Aggregate Remote Memory Copy Interface (ARMCI) runtime library on the Cray XT5 2.3 PetaFLOPs computer at Oak Ridge National Laboratory. We optimized our implementation with the flow intimation technique that we have introduced in this paper. Our optimized ARMCI implementation improves scalability of both the Global Arrays (GA) programming model and a real-world chemistry application - NWChem - from small jobs up through 180,000 cores.},
  note      = {7th ACM International Conference on Computing Frontiers, CF'10; conference dates: 17--19 May 2010},
}