% MatRIS tiled-Cholesky paper from the WAMTA 2024 workshop proceedings.
% Names use the unambiguous "Last, First" form; case-sensitive words in the
% title are brace-protected; the publisher is double-braced because its name
% contains a literal " and " that list-parsing backends would otherwise split on.
@inproceedings{54deebfe035648629555021365a4782b,
  author    = {Monil, Mohammad Alaul Haque and Miniskar, Narasinga Rao and Valero-Lara, Pedro and Teranishi, Keita and Vetter, Jeffrey S.},
  title     = {{MatRIS}: Addressing the Challenges for Portability and Heterogeneity Using Tasking for Matrix Decomposition ({Cholesky})},
  booktitle = {Asynchronous Many-Task Systems and Applications - 2nd International Workshop, {WAMTA} 2024, Proceedings},
  editor    = {Diehl, Patrick and Schuchart, Joseph and Valero-Lara, Pedro and Bosilca, George},
  series    = {Lecture Notes in Computer Science},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  year      = {2024},
  pages     = {59--70},
  doi       = {10.1007/978-3-031-61763-8_6},
  isbn      = {9783031617621},
  language  = {English},
  keywords  = {Cholesky Decomposition, Heterogeneity, Math Library, Portability, POTRF, Runtime System, Task based programming},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.; 2nd International Workshop on Asynchronous Many-Task Systems and Applications, WAMTA 2024 ; Conference date: 14-02-2024 Through 16-02-2024},
  abstract  = {The ubiquitous in-node heterogeneity of HPC and cloud computing platforms makes software portability and performance optimization extremely challenging. Described here, the MatRIS multilevel math library abstraction framework employs tasking to alleviate these difficulties. MatRIS includes the IRIS task-based runtime on the bottom level and exposes different layers of abstraction to render algorithms architecturally agnostic. MatRIS ensures the decomposition and creation of tasks that represent the necessary encapsulation of the optimized kernels from both vendor and open-source math libraries. Once built, MatRIS can select different combinations of accelerators at runtime, making it portable even on diverse heterogeneous architectures. By leveraging the IRIS runtime{\textquoteright}s features for managing heterogeneity, MatRIS deploys algorithms that remove the need to specify orchestration and data transfer. This study describes how the serial task abstraction of a tiled Cholesky factorization is made portable and scalable in the case of multi-device and multi-vendor heterogeneity on a node with NVIDIA and AMD GPUs by using MatRIS. First, we demonstrate that Cholesky in MatRIS provides multi-GPU scalability that offers competitive performance versus cuSolverMG. Then, we present the challenges and opportunities for heterogeneous execution.},
}