% Conference paper in the IPDPS 2010 proceedings (see booktitle and note).
% No series field is given: the proceedings title belongs in booktitle only,
% otherwise styles that print series would repeat it.
@inproceedings{0c0824a3c72045ab8d14447bbf09ee47,
  author    = {Hadri, Bilel and Ltaief, Hatem and Agullo, Emmanuel and Dongarra, Jack},
  title     = {Tile {QR} factorization with parallel panel processing for multicore architectures},
  booktitle = {Proceedings of the 2010 {IEEE} International Symposium on Parallel and Distributed Processing, {IPDPS} 2010},
  year      = {2010},
  doi       = {10.1109/IPDPS.2010.5470443},
  isbn      = {9781424464432},
  language  = {English (US)},
  keywords  = {Communication avoiding, Dynamic scheduling, Multicore, QR factorization, Tile algorithms},
  abstract  = {To exploit the potential of multicore architectures, recent dense linear algebra libraries have used tile algorithms, which consist in scheduling a Directed Acyclic Graph (DAG) of tasks of fine granularity where nodes represent tasks, either panel factorization or update of a block-column, and edges represent dependencies among them. Although past approaches already achieve high performance on moderate and large square matrices, their way of processing a panel in sequence leads to limited performance when factorizing tall and skinny matrices or small square matrices. We present a new fully asynchronous method for computing a QR factorization on shared-memory multicore architectures that overcomes this bottleneck. Our contribution is to adapt an existing algorithm that performs a panel factorization in parallel (named Communication-Avoiding QR and initially designed for distributed-memory machines), to the context of tile algorithms using asynchronous computations. An experimental study shows significant improvement (up to almost 10 times faster) compared to state-of-the-art approaches. We aim to eventually incorporate this work into the Parallel Linear Algebra for Scalable Multi-core Architectures (PLASMA) library.},
  note      = {24th IEEE International Parallel and Distributed Processing Symposium, IPDPS 2010 ; Conference date: 19-04-2010 Through 23-04-2010},
}