@InProceedings{Rentrop.Griebel.2020, author = {Lago, Rafael and Obersteiner, Michael and Pollinger, Theresa and Rentrop, Johannes and Bungartz, Hans-Joachim and Dannert, Tilman and Griebel, Michael and Jenko, Frank and Pfl{\"u}ger, Dirk}, editor = {Bungartz, Hans-Joachim and Reiz, Severin and Uekermann, Benjamin and Neumann, Philipp and Nagel, Wolfgang E.}, title = {{EXAHD}: {A} Massively Parallel Fault Tolerant Sparse Grid Approach for High-Dimensional Turbulent Plasma Simulations}, booktitle = {Software for Exascale Computing - SPPEXA 2016-2019}, year = {2020}, publisher = {Springer International Publishing}, address = {Cham}, pages = {301--329}, abstract = {Plasma fusion is one of the promising candidates for an emission-free energy source and is heavily investigated with high-resolution numerical simulations. Unfortunately, these simulations suffer from the curse of dimensionality due to the five-plus-one-dimensional nature of the equations. Hence, we propose a sparse grid approach based on the sparse grid combination technique which splits the simulation grid into multiple smaller grids of varying resolution. This enables us to increase the maximum resolution as well as the parallel efficiency of the current solvers. At the same time we introduce fault tolerance within the algorithmic design and increase the resilience of the application code. We base our implementation on a manager-worker approach which computes multiple solver runs in parallel by distributing tasks to different process groups. Our results demonstrate good convergence for linear fusion runs and show high parallel efficiency up to 180k cores. In addition, our framework achieves accurate results with low overhead in faulty environments. Moreover, for nonlinear fusion runs, we show the effectiveness of the combination technique and discuss existing shortcomings that are still under investigation.}, isbn = {978-3-030-47956-5}, doi = {10.1007/978-3-030-47956-5_11}, note = {Also available as INS Preprint No. 2001.} }