% Conference paper by R. H. Bisseling in a Springer "Lecture Notes in Computer
% Science" proceedings volume (workshop held in Rousse, Bulgaria, 1996).
% The abstract's ligatures (fi/ffi) and the square-root formula were restored
% after text-extraction damage.
% NOTE(review): volume 1196 is taken from the publisher record for this DOI --
% confirm against the printed volume.
@inproceedings{2a2998e7a46c41898f9bd37b129653b3,
  author    = {Bisseling, R. H.},
  title     = {Basic Techniques for Numerical Linear Algebra on Bulk Synchronous Parallel Computers},
  booktitle = {Proceedings First Workshop on Numerical Analysis and Applications, Rousse, Bulgaria 1996},
  editor    = {Vulkov, L. and Wasniewski, J. and Yalamov, P.},
  series    = {Lecture Notes in Computer Science},
  volume    = {1196},
  publisher = {Springer},
  year      = {1997},
  pages     = {46--57},
  doi       = {10.1007/3-540-62598-4_78},
  language  = {English},
  keywords  = {Wiskunde en Informatica (WIIN), Mathematics, Wiskunde en computerwetenschappen, Landbouwwetenschappen, Wiskunde: algemeen},
  abstract  = {The bulk synchronous parallel (BSP) model promises scalable and portable software for a wide range of applications. A BSP computer consists of several processors, each with private memory, and a communication network that delivers access to remote memory in uniform time. Numerical linear algebra computations can benefit from the BSP model, both in terms of simplicity and efficiency. Dense LU decomposition and other computations can be made more efficient by using the new technique of two-phase randomised broadcasting, which is motivated by a cost analysis in the BSP model. For LU decomposition with partial pivoting, this technique reduces the communication time by a factor of $(\sqrt{p} + 1)/3$, where $p$ is the number of processors. Theoretical analysis, together with benchmark values for machine parameters, can be used to predict execution time. Such predictions are verified by numerical experiments on a 64-processor Cray T3D. The experimental results confirm the advantage of two-phase randomised broadcasting.},
}