@comment{
  Conference paper by Jack Dongarra in the ISPA 2006 proceedings (Springer).
  Names are stored in "Last, First" form; each editor is listed exactly once.
  NOTE(review): no LNCS volume number is recorded for this entry; add a
  "volume" field once it has been confirmed against the publisher record.
}
@inproceedings{7fd33cb26ed345508a9bfd9f026170e7,
  author    = {Dongarra, Jack},
  title     = {The impact of multicore on math software and exploiting single precision computing to obtain double precision results},
  booktitle = {Parallel and Distributed Processing and Applications - 4th International Symposium, ISPA 2006, Proceedings},
  editor    = {Guo, Minyi and Yang, Laurence T. and {Di Martino}, Beniamino and Zima, Hans P. and Dongarra, Jack and Tang, Feilong},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  year      = {2006},
  pages     = {2},
  doi       = {10.1007/11946441_2},
  isbn      = {9783540680673},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2006.; 4th International Symposium on Parallel and Distributed Processing and Applications, ISPA 2006 ; Conference date: 04-12-2006 Through 06-12-2006},
  abstract  = {Recent versions of microprocessors exhibit performance characteristics for 32 bit floating point arithmetic (single precision) that is substantially higher than 64 bit floating point arithmetic (double precision). Examples include the Intel Pentium IV and M processors, AMD Opteron architectures, the IBM Cell processor and various GPUs. When working in single precision, floating point operations can be performed up to two times faster on the Pentium and up to ten times faster on the Cell over double precision. The motivation for this work is to exploit single precision operations whenever possible and resort to double precision at critical stages while attempting to provide the full double precision results. The results described here are fairly general and can be applied to various problems in linear algebra such as solving large sparse systems, using direct or iterative methods and some eigenvalue problems. There are limitations to the success of this process, such as when the conditioning of the problem exceeds the reciprocal of the accuracy of the single precision computations. In that case the double precision algorithm should be used.},
}