% Yamazaki, Kurzak, Luszczek, Dongarra: tree-based tile QR on a 3D virtual
% systolic array (PULSAR runtime), IPDPSW 2014 workshop paper.
% NOTE(review): month/day below differ from the conference date given in the
% note field (19-23 May 2014); presumably the online publication date -- confirm.
@inproceedings{884719ae8dc84a09a80126b3d48f8531,
  author    = {Yamazaki, Ichitaro and Kurzak, Jakub and Luszczek, Piotr and Dongarra, Jack},
  title     = {Design and implementation of a large scale tree-based {QR} decomposition using a {3D} virtual systolic array and a lightweight runtime},
  booktitle = {Proceedings - {IEEE} 28th International Parallel and Distributed Processing Symposium Workshops, {IPDPSW} 2014},
  pages     = {1495--1504},
  publisher = {IEEE Computer Society},
  year      = {2014},
  month     = nov,
  day       = {27},
  doi       = {10.1109/IPDPSW.2014.167},
  language  = {English},
  keywords  = {Dataflow, Message-passing, Multithreading, QR decomposition, Runtime, Systolic array},
  abstract  = {A systolic array provides an alternative computing paradigm to the von Neumann architecture. Though its hardware implementation has failed as a paradigm to design integrated circuits in the past, we are now discovering that the systolic array as a software virtualization layer can lead to an extremely scalable execution paradigm. To demonstrate this scalability, in this paper, we design and implement a 3D virtual systolic array to compute a tile QR decomposition of a tall-and-skinny dense matrix. Our implementation is based on a state-of-the-art algorithm that factorizes a panel based on a tree-reduction. Using a runtime developed as a part of the Parallel Ultra Light Systolic Array Runtime (PULSAR) project, we demonstrate on a Cray-XT5 machine how our virtual systolic array can be mapped to a large-scale machine and obtain excellent parallel performance. This is an important contribution since such a QR decomposition is used, for example, to compute a least squares solution of an overdetermined system, which arises in many scientific and engineering problems.},
  note      = {Publisher Copyright: {\textcopyright} 2014 IEEE.; 28th IEEE International Parallel and Distributed Processing Symposium Workshops, IPDPSW 2014 ; Conference date: 19-05-2014 Through 23-05-2014},
}