% Workshop paper in the SC 2024-W proceedings (IEEE), pages 677--681.
% Event name, event dates and the publisher copyright line are stored in their
% own fields instead of `note`, so they are not printed as free-form trailing text.
% The full proceedings title lives in `booktitle`; it is not repeated in `series`.
@inproceedings{7685dcd74cde4ada96cf325e8cc329a2,
  author     = {Welch, Aaron and Hernandez, Oscar and Poole, Stephen and Poole, Wendy},
  title      = {Enhancing Small Message Aggregation with Directive-Based Deferred Execution},
  booktitle  = {Proceedings of {SC} 2024-W: Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2024},
  pages      = {677--681},
  doi        = {10.1109/SCW63240.2024.00094},
  language   = {English},
  keywords   = {Compilers, Conveyors, Deferred Execution, Message Aggregation, OpenSHMEM},
  abstract   = {The partitioned global address space (PGAS) model offers one-sided communication operations to efficiently access local and remote data through a distributed shared memory model using point-to-point network operations. An extension to the OpenSHMEM PGAS library previously demonstrated how message aggregation could be applied in a minimally intrusive manner to an application, while still achieving a significant portion of the performance possible through manual tuning. However, its primary deficiency was the inability to abstract dependencies between aggregated remote memory accesses and their subsequent uses, which must be managed explicitly by applications. This undermined its goal of preserving algorithmic intent. In this paper, we present a novel directive-based approach for automatically deferring the execution of arbitrary code that depends on aggregated messages, shifting the concern of their efficient management from the application to the implementation. We demonstrate our approach using two applications from the bale 3.0 classic suite on the Frontier supercomputer.},
  eventtitle = {2024 Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis, {SC} Workshops 2024},
  eventdate  = {2024-11-17/2024-11-22},
  copyright  = {Publisher Copyright: {\textcopyright} 2024 IEEE.},
}