@inproceedings{e7e2ad19b2114c54a7608588af1fa8a2,
title = "Linear Systems Solvers for Distributed-Memory Machines with GPU Accelerators",
abstract = "This work presents two implementations of linear solvers for distributed-memory machines with GPU accelerators—one based on the Cholesky factorization and one based on the LU factorization with partial pivoting. The routines are developed as part of the Software for Linear Algebra Targeting Exascale (SLATE) package, which represents a sharp departure from the traditional conventions established by legacy packages, such as LAPACK and ScaLAPACK. The article lays out the principles of the new approach, discusses the implementation details, and presents the performance results.",
keywords = "Cholesky factorization, Distributed memory, GPU acceleration, LU factorization, Linear algebra, Linear systems of equations",
author = "Jakub Kurzak and Mark Gates and Ali Charara and Asim YarKhan and Ichitaro Yamazaki and Jack Dongarra",
note = "Publisher Copyright: {\textcopyright} 2019, Springer Nature Switzerland AG.; 25th International European Conference on Parallel and Distributed Computing, Euro-Par 2019 ; Conference date: 26-08-2019 Through 30-08-2019",
year = "2019",
doi = "10.1007/978-3-030-29400-7_35",
language = "English",
isbn = "9783030293994",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "495--506",
editor = "Ramin Yahyapour",
booktitle = "Euro-Par 2019",
}