% Conference paper describing the design of the ScaLAPACK library (1994).
% The citation key is an export-generated identifier and is kept unchanged so
% that existing citations continue to resolve.
% NOTE(review): the note field names the "8th International Parallel Processing
% Symposium", while booktitle names the "International Conference on Parallel
% Processing". Both are kept as exported -- TODO confirm the venue against the
% publisher record and correct booktitle if needed.
@inproceedings{0b6ad201033045feae02d8d646ffa3f7,
  author    = {Choi, Jaeyoung and Dongarra, Jack J. and Walker, David W.},
  title     = {Design of scalable software libraries for distributed memory concurrent computers},
  booktitle = {Proceedings of the International Conference on Parallel Processing},
  year      = {1994},
  pages     = {792--799},
  publisher = {IEEE},
  isbn      = {0818656026},
  language  = {English},
  note      = {Proceedings of the 8th International Parallel Processing Symposium ; Conference date: 26-04-1994 Through 29-04-1994},
  abstract  = {This paper describes the design of ScaLAPACK, a scalable software library for performing dense and banded linear algebra computations on distributed memory concurrent computers. The specification of the data distribution has important consequences for interprocessor communication and load balance, and hence is a major factor in determining performance and scalability of the library routines. The block cyclic data distribution is adopted as a simple, yet general-purpose, way of decomposing block-partitioned matrices. Distributed memory versions of the Level 3 BLAS provide an easy and convenient way of implementing the ScaLAPACK routines.},
}