% Conference paper published in the proceedings of ISC High Performance 2016
% (Lecture Notes in Computer Science series).
% Conventions: names are stored as "Last, First"; non-ASCII characters are
% written as LaTeX escapes so the entry also works with classic 8-bit BibTeX.
% NOTE(review): the LNCS volume number is not recorded here; add a volume
% field once it has been confirmed against the publisher's record.
@inproceedings{d0640ce1d74f48949423c93d942ef015,
  author    = {Morris, Karla and Rizzi, Francesco and Sargsyan, Khachik and Dahlgren, Kathryn and Mycek, Paul and Safta, Cosmin and Le Ma{\^i}tre, Olivier and Knio, Omar and Debusschere, Bert},
  title     = {Scalability of partial differential equations preconditioner resilient to soft and hard faults},
  booktitle = {High Performance Computing -- 31st International Conference, {ISC} High Performance 2016, Proceedings},
  editor    = {Dongarra, Jack and Kunkel, Julian M. and Balaji, Pavan},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer International Publishing},
  address   = {Cham},
  year      = {2016},
  pages     = {469--485},
  isbn      = {9783319413204},
  doi       = {10.1007/978-3-319-41321-1_24},
  language  = {English (US)},
  note      = {Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2016.; 31st International Conference on High Performance Computing, ISC High Performance 2016 ; Conference date: 19-06-2016 Through 23-06-2016},
  abstract  = {We present a resilient domain-decomposition preconditioner for partial differential equations (PDEs). The algorithm reformulates the PDE as a sampling problem, followed by a solution update through data manipulation that is resilient to both soft and hard faults. We discuss an implementation based on a server-client model where all state information is held by the servers, while clients are designed solely as computational units. Servers are assumed to be ``sandboxed'', while no assumption is made on the reliability of the clients. We explore the scalability of the algorithm up to $\sim$12k cores, build an SST/macro skeleton to extrapolate to $\sim$50k cores, and show the resilience under simulated hard and soft faults for a 2D linear Poisson equation.},
}