% references.bib -- generated from numpex/deliverable.template
@article{trahay_exa-soft_nodate,
title = {Exa-{SofT} – performance analysis},
language = {en},
author = {Trahay, François},
}
@misc{cardosi_specx_2023,
title = {Specx: a {C}++ task-based runtime system for heterogeneous distributed architectures},
copyright = {Creative Commons Attribution 4.0 International},
shorttitle = {Specx},
url = {https://arxiv.org/abs/2308.15964},
doi = {10.48550/ARXIV.2308.15964},
abstract = {Parallelization is needed everywhere, from laptops and mobile phones to supercomputers. Among parallel programming models, task-based programming has demonstrated a powerful potential and is widely used in high-performance scientific computing. Not only does it allow for efficient parallelization across distributed heterogeneous computing nodes, but it also allows for elegant source code structuring by describing hardware-independent algorithms. In this paper, we present Specx, a task-based runtime system written in modern C++. Specx supports distributed heterogeneous computing by simultaneously exploiting CPUs and GPUs (CUDA/HIP) and incorporating communication into the task graph. We describe the specificities of Specx and demonstrate its potential by running parallel applications.},
urldate = {2024-10-15},
publisher = {arXiv},
author = {Cardosi, Paul and Bramas, Bérenger},
year = {2023},
note = {Version Number: 1},
keywords = {Distributed, Parallel, and Cluster Computing (cs.DC), FOS: Computer and information sciences, Software Engineering (cs.SE)},
}
@misc{Palazollo_Feel_Shape_Optimization,
title = {Feel++ shape optimization toolbox},
copyright = {LGPL-3.0-or-later},
url = {https://github.com/feelpp/feelpp-shapo},
author = {Palazollo, Lucas and Prud'homme, Christophe},
year = {2024},
}
@book{britain_standard_1990,
title = {The {Standard} {NAFEMS} {Benchmarks}},
publisher = {NAFEMS},
author = {{National Agency for Finite Element Methods \& Standards (Great Britain)}},
year = {1990},
}
@article{nguessan_high_2021,
series = {Numerical {Solution} of {Differential} and {Differential}-{Algebraic} {Equations}. {Selected} {Papers} from {NUMDIFF}-15},
title = {High order time integration and mesh adaptation with error control for incompressible {Navier}–{Stokes} and scalar transport resolution on dual grids},
volume = {387},
issn = {0377-0427},
url = {https://www.sciencedirect.com/science/article/pii/S0377042719305473},
doi = {10.1016/j.cam.2019.112542},
abstract = {Relying on a building block developed by the authors in order to resolve the incompressible Navier–Stokes equation with high order implicit time stepping and dynamic mesh adaptation based on multiresolution analysis with collocated variables, the present contribution investigates the ability to extend such a strategy for scalar transport at relatively large Schmidt numbers using a finer level of refinement compared to the resolution of the hydrodynamic variables, while preserving space adaptation with error control. This building block is a key part of a strategy to construct a low-Mach number code based on a splitting strategy for combustion applications, where several spatial scales are into play. The computational efficiency and accuracy of the proposed strategy is assessed on a well-chosen three-vortex simulation.},
urldate = {2024-10-15},
journal = {Journal of Computational and Applied Mathematics},
author = {N’Guessan, Marc-Arthur and Massot, Marc and Séries, Laurent and Tenaud, Christian},
month = may,
year = {2021},
keywords = {Dual grid with error control, Dynamic mesh adaptation, High order implicit Runge Kutta, Incompressible Navier–Stokes, Multiresolution analysis, Scalar transport},
pages = {112542},
}
@phdthesis{lecointre_hydrogen_nodate,
title = {Hydrogen flame acceleration in non-uniform mixtures},
abstract = {This thesis, carried out with the support of the CEA, presents the development of numerical methods dedicated to the simulation of the acceleration process of a hydrogen flame.},
language = {fr},
author = {Lecointre, Luc},
}
@article{duarte_adaptive_nodate,
title = {Adaptive numerical methods in time and space for the simulation of multi-scale reaction fronts.},
language = {fr},
author = {Duarte, Max Pedro},
}
@article{helbecque_parallel_2023,
title = {Parallel distributed productivity‐aware tree‐search using {Chapel}},
volume = {35},
issn = {1532-0626, 1532-0634},
url = {https://onlinelibrary.wiley.com/doi/10.1002/cpe.7874},
doi = {10.1002/cpe.7874},
abstract = {With the recent arrival of the exascale era, modern supercomputers are increasingly big making their programming much more complex. In addition to performance, software productivity is a major concern to choose a programming language, such as Chapel, designed for exascale computing. In this paper, we investigate the design of a parallel distributed tree-search algorithm, namely P3D-DFS, and its implementation using Chapel. The design is based on the Chapel's DistBag data structure, revisited by: (1) redefining the data structure for Depth-First tree-Search (DFS), henceforth renamed DistBag-DFS; (2) redesigning the underlying load balancing mechanism. In addition, we propose two instantiations of P3D-DFS considering the Branch-and-Bound (B\&B) and Unbalanced Tree Search (UTS) algorithms. In order to evaluate how much performance is traded for productivity, we compare the Chapel-based implementations of B\&B and UTS to their best-known counterparts based on traditional OpenMP (intra-node) and MPI+X (inter-node). For experimental validation using 4096 processing cores, we consider the permutation flow-shop scheduling problem for B\&B and synthetic literature benchmarks for UTS. The reported results show that P3D-DFS competes with its OpenMP baselines for coarser-grained shared-memory scenarios, and with its MPI+X counterparts for distributed-memory settings, considering both performance and productivity-awareness. In the context of this work, this makes Chapel an alternative to OpenMP/MPI+X for exascale programming.},
language = {en},
number = {27},
urldate = {2024-10-15},
journal = {Concurrency and Computation: Practice and Experience},
author = {Helbecque, Guillaume and Gmys, Jan and Melab, Nouredine and Carneiro, Tiago and Bouvry, Pascal},
month = dec,
year = {2023},
pages = {e7874},
}
@incollection{franco_pgas_2024,
address = {Cham},
title = {{PGAS} {Data} {Structure} for {Unbalanced} {Tree}-{Based} {Algorithms} at {Scale}},
volume = {14834},
isbn = {978-3-031-63758-2 978-3-031-63759-9},
url = {https://link.springer.com/10.1007/978-3-031-63759-9_13},
language = {en},
urldate = {2024-10-15},
booktitle = {Computational {Science} – {ICCS} 2024},
publisher = {Springer Nature Switzerland},
author = {Helbecque, Guillaume and Carneiro, Tiago and Melab, Nouredine and Gmys, Jan and Bouvry, Pascal},
editor = {Franco, Leonardo and De Mulatier, Clélia and Paszynski, Maciej and Krzhizhanovskaya, Valeria V. and Dongarra, Jack J. and Sloot, Peter M. A.},
year = {2024},
doi = {10.1007/978-3-031-63759-9_13},
note = {Series Title: Lecture Notes in Computer Science},
pages = {103--111},
}
@article{gmys_exactly_2022,
title = {Exactly {Solving} {Hard} {Permutation} {Flowshop} {Scheduling} {Problems} on {Peta}-{Scale} {GPU}-{Accelerated} {Supercomputers}},
volume = {34},
issn = {1091-9856, 1526-5528},
url = {https://pubsonline.informs.org/doi/10.1287/ijoc.2022.1193},
doi = {10.1287/ijoc.2022.1193},
abstract = {Makespan minimization in permutation flow-shop scheduling is a well-known hard combinatorial optimization problem. Among the 120 standard benchmark instances proposed by E. Taillard in 1993, 23 have remained unsolved for almost three decades. In this paper, we present our attempts to solve these instances to optimality using parallel Branch-and-Bound (BB) on the GPU-accelerated Jean Zay supercomputer. We report the exact solution of 11 previously unsolved problem instances and improved upper bounds for eight instances. The solution of these problems requires both algorithmic improvements and leveraging the computing power of peta-scale high-performance computing platforms. The challenge consists in efficiently performing parallel depth-first traversal of a highly irregular and fine-grained search tree on distributed systems composed of hundreds of massively parallel accelerator devices and multicore processors. We present and discuss the design and implementation of our permutation-based BB and experimentally evaluate its parallel performance on up to 384 V100 GPUs (2 million CUDA cores) and 3840 CPU cores. The optimality proof for the largest solved instance requires about 64 CPU-years of computation—using 256 GPUs and over 4 million parallel search agents, the traversal of the search tree is completed in 13 hours, exploring [Formula: see text] nodes.},
language = {en},
number = {5},
urldate = {2024-10-15},
journal = {INFORMS Journal on Computing},
author = {Gmys, Jan},
month = sep,
year = {2022},
pages = {2502--2522},
}
@article{delorme_novel_nodate,
title = {Novel numerical methods for solar convection: the {Dyablo} {Whole}-{Sun} adaptive mesh refinement code},
abstract = {We present a new solar simulation code named Dyablo Whole-Sun (DWS) and the first steps of its validation. DWS is a novel portable high-performance code aiming at making the first holistic simulations of the Sun, from the radiative interior to the corona. We discuss the validation of the development of the code using a solar convection benchmark in Cartesian geometry.},
language = {en},
author = {Delorme, M and Durocher, A and Brun, A S and Strugarek, A},
}
@article{dubey_survey_2014,
series = {Domain-{Specific} {Languages} and {High}-{Level} {Frameworks} for {High}-{Performance} {Computing}},
title = {A survey of high level frameworks in block-structured adaptive mesh refinement packages},
volume = {74},
issn = {0743-7315},
url = {https://www.sciencedirect.com/science/article/pii/S0743731514001178},
doi = {10.1016/j.jpdc.2014.07.001},
abstract = {Over the last decade block-structured adaptive mesh refinement (SAMR) has found increasing use in large, publicly available codes and frameworks. SAMR frameworks have evolved along different paths. Some have stayed focused on specific domain areas, others have pursued a more general functionality, providing the building blocks for a larger variety of applications. In this survey paper we examine a representative set of SAMR packages and SAMR-based codes that have been in existence for half a decade or more, have a reasonably sized and active user base outside of their home institutions, and are publicly available. The set consists of a mix of SAMR packages and application codes that cover a broad range of scientific domains. We look at their high-level frameworks, their design trade-offs and their approach to dealing with the advent of radical changes in hardware architecture. The codes included in this survey are BoxLib, Cactus, Chombo, Enzo, FLASH, and Uintah.},
number = {12},
urldate = {2024-10-14},
journal = {Journal of Parallel and Distributed Computing},
author = {Dubey, Anshu and Almgren, Ann and Bell, John and Berzins, Martin and Brandt, Steve and Bryan, Greg and Colella, Phillip and Graves, Daniel and Lijewski, Michael and Löffler, Frank and O’Shea, Brian and Schnetter, Erik and Van Straalen, Brian and Weide, Klaus},
month = dec,
year = {2014},
keywords = {BoxLib, Cactus, Chombo, Enzo, FLASH, SAMR, Uintah},
pages = {3217--3227},
}
@article{cohen_fully_2003,
title = {Fully adaptive multiresolution finite volume schemes for conservation laws},
volume = {72},
issn = {0025-5718, 1088-6842},
url = {https://www.ams.org/mcom/2003-72-241/S0025-5718-01-01391-6/},
doi = {10.1090/S0025-5718-01-01391-6},
language = {English},
number = {241},
urldate = {2024-10-14},
journal = {Mathematics of Computation},
author = {Cohen, Albert and Kaber, Sidi and Müller, Siegfried and Postel, Marie},
year = {2003},
keywords = {Conservation laws, adaptivity, finite volume schemes, multiresolution, wavelets.},
pages = {183--225},
}
@article{krah_wavelet_2022,
title = {Wavelet adaptive proper orthogonal decomposition for large-scale flow data},
volume = {48},
issn = {1572-9044},
url = {https://doi.org/10.1007/s10444-021-09922-2},
doi = {10.1007/s10444-021-09922-2},
abstract = {The proper orthogonal decomposition (POD) is a powerful classical tool in fluid mechanics used, for instance, for model reduction and extraction of coherent flow features. However, its applicability to high-resolution data, as produced by three-dimensional direct numerical simulations, is limited owing to its computational complexity. Here, we propose a wavelet-based adaptive version of the POD (the wPOD), in order to overcome this limitation. The amount of data to be analyzed is reduced by compressing them using biorthogonal wavelets, yielding a sparse representation while conveniently providing control of the compression error. Numerical analysis shows how the distinct error contributions of wavelet compression and POD truncation can be balanced under certain assumptions, allowing us to efficiently process high-resolution data from three-dimensional simulations of flow problems. Using a synthetic academic test case, we compare our algorithm with the randomized singular value decomposition. Furthermore, we demonstrate the ability of our method analyzing data of a two-dimensional wake flow and a three-dimensional flow generated by a flapping insect computed with direct numerical simulation.},
language = {en},
number = {2},
urldate = {2024-10-14},
journal = {Advances in Computational Mathematics},
author = {Krah, Philipp and Engels, Thomas and Schneider, Kai and Reiss, Julius},
month = feb,
year = {2022},
keywords = {Biorthogonal wavelets, Fluid dynamics, Proper orthogonal decomposition, Reduced order models, Wavelet adaptive block-based grids},
pages = {10},
}
@article{gillis_murphy---scalable_2022,
title = {{MURPHY}---{A} {Scalable} {Multiresolution} {Framework} for {Scientific} {Computing} on {3D} {Block}-{Structured} {Collocated} {Grids}},
volume = {44},
issn = {1064-8275},
url = {https://epubs.siam.org/doi/abs/10.1137/21M141676X},
doi = {10.1137/21M141676X},
number = {5},
urldate = {2024-10-14},
journal = {SIAM Journal on Scientific Computing},
author = {Gillis, Thomas and van Rees, Wim M.},
month = oct,
year = {2022},
note = {Publisher: Society for Industrial and Applied Mathematics},
pages = {C367--C398},
}
@article{zhang_amrex_2021,
title = {{AMReX}: {Block}-structured adaptive mesh refinement for multiphysics applications},
volume = {35},
issn = {1094-3420},
shorttitle = {{AMReX}},
url = {https://doi.org/10.1177/10943420211022811},
doi = {10.1177/10943420211022811},
abstract = {Block-structured adaptive mesh refinement (AMR) provides the basis for the temporal and spatial discretization strategy for a number of Exascale Computing Project applications in the areas of accelerator design, additive manufacturing, astrophysics, combustion, cosmology, multiphase flow, and wind plant modeling. AMReX is a software framework that provides a unified infrastructure with the functionality needed for these and other AMR applications to be able to effectively and efficiently utilize machines from laptops to exascale architectures. AMR reduces the computational cost and memory footprint compared to a uniform mesh while preserving accurate descriptions of different physical processes in complex multiphysics algorithms. AMReX supports algorithms that solve systems of partial differential equations in simple or complex geometries and those that use particles and/or particle–mesh operations to represent component physical processes. In this article, we will discuss the core elements of the AMReX framework such as data containers and iterators as well as several specialized operations to meet the needs of the application projects. In addition, we will highlight the strategy that the AMReX team is pursuing to achieve highly performant code across a range of accelerator-based architectures for a variety of different applications.},
language = {en},
number = {6},
urldate = {2024-10-14},
journal = {The International Journal of High Performance Computing Applications},
author = {Zhang, Weiqun and Myers, Andrew and Gott, Kevin and Almgren, Ann and Bell, John},
month = nov,
year = {2021},
note = {Publisher: SAGE Publications Ltd STM},
pages = {508--526},
}
@article{burstedde_p4est_2011,
title = {p4est: {Scalable} {Algorithms} for {Parallel} {Adaptive} {Mesh} {Refinement} on {Forests} of {Octrees}},
volume = {33},
issn = {1064-8275},
shorttitle = {p4est},
url = {https://epubs.siam.org/doi/abs/10.1137/100791634},
doi = {10.1137/100791634},
abstract = {In this article, we propose new parallel algorithms for the construction and 2:1 balance refinement of large linear octrees on distributed memory machines. Such octrees are used in many problems in computational science and engineering, e.g., object representation, image analysis, unstructured meshing, finite elements, adaptive mesh refinement, and N-body simulations. Fixed-size scalability and isogranular analysis of the algorithms using an MPI-based parallel implementation was performed on a variety of input data and demonstrated good scalability for different processor counts (1 to 1024 processors) on the Pittsburgh Supercomputing Center's TCS-1 AlphaServer. The results are consistent for different data distributions. Octrees with over a billion octants were constructed and balanced in less than a minute on 1024 processors. Like other existing algorithms for constructing and balancing octrees, our algorithms have $\mathcal{O}(N \log N)$ work and $\mathcal{O}(N)$ storage complexity. Under reasonable assumptions on the distribution of octants and the work per octant, the parallel time complexity is $\mathcal{O}(\frac{N}{n_p} \log(\frac{N}{n_p}) + n_p \log n_p)$, where $N$ is the size of the final linear octree and $n_p$ is the number of processors.},
number = {3},
urldate = {2024-10-14},
journal = {SIAM Journal on Scientific Computing},
author = {Burstedde, Carsten and Wilcox, Lucas C. and Ghattas, Omar},
month = jan,
year = {2011},
note = {Publisher: Society for Industrial and Applied Mathematics},
pages = {1103--1133},
}
@article{bellotti_numerical_nodate,
title = {Numerical analysis of lattice {Boltzmann} schemes: from fundamental issues to efficient and accurate adaptive methods},
language = {en},
author = {Bellotti, Thomas},
}
@article{bellotti_multiresolution-based_2022,
title = {Multiresolution-{Based} {Mesh} {Adaptation} and {Error} {Control} for {Lattice} {Boltzmann} {Methods} with {Applications} to {Hyperbolic} {Conservation} {Laws}},
volume = {44},
issn = {1064-8275},
url = {https://epubs.siam.org/doi/abs/10.1137/21M140256X},
doi = {10.1137/21M140256X},
abstract = {Lattice Boltzmann methods (LBM) stand out for their simplicity and computational efficiency while offering the possibility of simulating complex phenomena. While they are optimal for Cartesian meshes, adapted meshes have traditionally been a stumbling block since it is difficult to predict the right physics through various levels of meshes. In this work, we design a class of fully adaptive LBM methods with dynamic mesh adaptation and error control relying on multiresolution analysis. This wavelet-based approach allows us to adapt the mesh based on the regularity of the solution and leads to a very efficient compression of the solution without loosing its quality and with the preservation of the properties of the original LBM method on the finest grid. This yields a general approach for a large spectrum of schemes and allows precise error bounds, without the need for deep modifications on the reference scheme. An error analysis is proposed. For the purpose of validating this error analysis, we conduct a series of test cases for various schemes and scalar and systems of conservation laws, where solutions with shocks are to be found and local mesh adaptation is especially relevant. Theoretical estimates are retrieved while a reduced memory footprint is observed. It paves the way to an implementation in a multidimensional framework and high computational efficiency of the method for both parabolic and hyperbolic equations, which is the subject of a companion paper.
},
keywords = {lattice Boltzmann method, multiresolution analysis, wavelets, dynamic mesh adaptation, error control, hyperbolic conservation laws},
number = {4},
urldate = {2024-10-14},
journal = {SIAM Journal on Scientific Computing},
author = {Bellotti, Thomas and Gouarin, Loïc and Graille, Benjamin and Massot, Marc},
month = aug,
year = {2022},
note = {Publisher: Society for Industrial and Applied Mathematics},
pages = {A2599--A2627},
}
@article{bellotti_multidimensional_2022,
title = {Multidimensional fully adaptive lattice {Boltzmann} methods with error control based on multiresolution analysis},
volume = {471},
issn = {0021-9991},
url = {https://www.sciencedirect.com/science/article/pii/S0021999122007331},
doi = {10.1016/j.jcp.2022.111670},
abstract = {Lattice-Boltzmann methods are known for their simplicity, efficiency and ease of parallelization, usually relying on uniform Cartesian meshes with a strong bond between spatial and temporal discretization. This fact complicates the crucial issue of reducing the computational cost and the memory impact by automatically coarsening the grid where a fine mesh is unnecessary, still ensuring the overall quality of the numerical solution through error control. This work provides a possible answer to this interesting question, by connecting, for the first time, the field of lattice-Boltzmann Methods (LBM) to the adaptive multiresolution (MR) approach based on wavelets. To this end, we employ a MR multi-scale transform to adapt the mesh as the solution evolves in time according to its local regularity. The collision phase is not affected due to its inherent local nature and because we do not modify the speed of the sound, contrarily to most of the LBM/Adaptive Mesh Refinement (AMR) strategies proposed in the literature, thus preserving the original structure of any LBM scheme. Besides, an original use of the MR allows the scheme to resolve the proper physics by efficiently controlling the accuracy of the transport phase. We carefully test our method to conclude on its adaptability to a wide family of existing lattice Boltzmann schemes, treating both hyperbolic and parabolic systems of equations, thus being less problem-dependent than the AMR approaches, which have a hard time guaranteeing an effective control on the error. The ability of the method to yield a very efficient compression rate and thus a computational cost reduction for solutions involving localized structures with loss of regularity is also shown, while guaranteeing a precise control on the approximation error introduced by the spatial adaptation of the grid. The numerical strategy is implemented on a specific open-source platform called SAMURAI with a dedicated data-structure relying on set algebra.},
urldate = {2024-10-14},
journal = {Journal of Computational Physics},
author = {Bellotti, Thomas and Gouarin, Loïc and Graille, Benjamin and Massot, Marc},
month = dec,
year = {2022},
keywords = {Dynamic mesh adaptation, Error control, Hyperbolic systems of conservation laws, Incompressible Navier-Stokes equations, Lattice Boltzmann method, Multiresolution analysis},
pages = {111670},
}
@inproceedings{jamond_manta_2022,
address = {Giens, France},
title = {{MANTA} : un code {HPC} généraliste pour la simulation de problèmes complexes en mécanique},
shorttitle = {{MANTA}},
url = {https://hal.science/hal-03688160},
abstract = {The MANTA code aims to enable complex mechanics simulations on current and future supercomputers while preserving the fundamentals of the codes developed at CEA: adaptability to the problem at hand, robustness of the algorithms, and durability of the models and of the code. We present the development principles of this new-generation code, and a few representative examples of its current capabilities are also described.},
urldate = {2024-10-14},
booktitle = {{CSMA} 2022 15ème {Colloque} {National} en {Calcul} des {Structures}},
author = {Jamond, Olivier and Lelong, Nicolas and Fourmont, Axel and Bluthé, Joffrey and Breuze, Matthieu and Bouda, Pascal and Brooking, Guillaume and Drui, Florence and Epalle, Alexandre and Fandeur, Olivier and Folzan, Gauthier and Helfer, Thomas and Kloss, Francis and Latu, Guillaume and Motte, Antoine and Nahed, Christopher and Picard, Alexis and Prat, Raphael and Ramière, Isabelle and Steins, Morgane and Prabel, Benoit},
month = may,
year = {2022},
keywords = {Code de calcul, Eléments finis, HPC, Implicite - explicite, Mécanique des fluides, Mécanique des structures, Toolbox, Volumes finis},
}
@inproceedings{jamond_manta_2024,
address = {Giens, France},
title = {{MANTA}: an industrial-strength open-source high performance explicit and implicit multi-physics solver},
shorttitle = {{MANTA}},
url = {https://hal.science/hal-04610968},
urldate = {2024-10-14},
booktitle = {16ème {Colloque} {National} en {Calcul} de {Structures}},
publisher = {CNRS, CSMA, ENS Paris-Saclay, CentraleSupélec},
author = {Jamond, Olivier and Lelong, Nicolas and Brooking, Guillaume and Helfer, Thomas and Prabel, Benoit and Prat, Raphael and Jaccon, Adrien},
month = may,
year = {2024},
keywords = {HPC, Industrial applications, PDEs solving, fluid mechanics, multiphysics coupling, structural mechanics},
}
@misc{noauthor_16eme_nodate,
title = {16ème {Colloque} {National} en {Calcul} de {Structures} - {Sciencesconf}.org},
url = {https://csma2024.sciencesconf.org/517460},
urldate = {2024-10-14},
}
@phdthesis{daver2016,
type = {phd},
title = {Reduced basis method applied to large non-linear multi-physics problems: application to high field magnets design},
url = {http://www.theses.fr/2016STRAD019},
author = {Daversin-Catty, Cécile},
year = {2016},
note = {2016STRAD019},
}
@phdthesis{Hild2020,
type = {phd},
title = {Control and optimization of high magnetic fields},
url = {http://www.theses.fr/2020STRAD031},
author = {Hild, Romain},
year = {2020},
note = {2020STRAD031},
}
@article{wang_fluid_2016,
title = {Fluid and structure coupling analysis of the interaction between aqueous humor and iris},
volume = {15},
issn = {1475-925X},
url = {http://biomedical-engineering-online.biomedcentral.com/articles/10.1186/s12938-016-0261-3},
doi = {10.1186/s12938-016-0261-3},
language = {en},
number = {S2},
urldate = {2024-10-14},
journal = {BioMedical Engineering OnLine},
author = {Wang, Wenjia and Qian, Xiuqing and Song, Hongfang and Zhang, Mindi and Liu, Zhicheng},
month = dec,
year = {2016},
pages = {133},
}
@book{ansorge_programming_2022,
edition = {1},
title = {Programming in {Parallel} with {CUDA}: {A} {Practical} {Guide}},
copyright = {https://www.cambridge.org/core/terms},
isbn = {978-1-108-85527-3 978-1-108-47953-0},
shorttitle = {Programming in {Parallel} with {CUDA}},
url = {https://www.cambridge.org/core/product/identifier/9781108855273/type/book},
abstract = {CUDA is now the dominant language used for programming GPUs, one of the most exciting hardware developments of recent decades. With CUDA, you can use a desktop PC for work that would have previously required a large cluster of PCs or access to a HPC facility. As a result, CUDA is increasingly important in scientific and technical computing across the whole STEM community, from medical physics and financial modelling to big data applications and beyond. This unique book on CUDA draws on the author's passion for and long experience of developing and using computers to acquire and analyse scientific data. The result is an innovative text featuring a much richer set of examples than found in any other comparable book on GPU computing. Much attention has been paid to the C++ coding style, which is compact, elegant and efficient. A code base of examples and supporting material is available online, which readers can build on for their own projects.},
language = {en},
urldate = {2024-10-11},
publisher = {Cambridge University Press},
author = {Ansorge, Richard},
month = may,
year = {2022},
doi = {10.1017/9781108855273},
}
@article{noauthor_cuda_nodate,
title = {{CUDA} {GRAPHS} in {GROMACS}},
language = {en},
}
@article{schoonover_mpi_nodate,
title = {{MPI}+ {Programming} with {HIP} and {OpenMP}},
language = {en},
author = {Schoonover, Joe},
}
@article{edvalson_readthedocs-breathe_nodate,
title = {{ReadTheDocs}-{Breathe} {Documentation}},
language = {en},
author = {Edvalson, Thomas},
}
@article{maia_rocm_nodate,
title = {{ROCm}™ {Library} {Support} \& {Profiling} {Tools}},
language = {en},
author = {Maia, Julio and Chalmers, Noel and Bauman, Paul T and Curtis, Nicholas and Malaya, Nicholas and McDougall, Damon and van Oostrum, Rene},
}
@article{malavally_amd_nodate,
title = {{AMD} {HIP} {Programming} {Guide}},
language = {en},
author = {Malavally, Roopa},
}
@article{noauthor_use_nodate,
title = {Use {ROCm}™ on {Radeon}™ {GPUs} {Documentation}},
language = {en},
}
@article{noauthor_cuda_nodate-1,
title = {{CUDA} {C}++ {Programming} {Guide}},
}
@article{parks_recycling_2006,
title = {Recycling {Krylov} {Subspaces} for {Sequences} of {Linear} {Systems}},
volume = {28},
issn = {1064-8275, 1095-7197},
url = {http://epubs.siam.org/doi/10.1137/040607277},
doi = {10.1137/040607277},
language = {en},
number = {5},
urldate = {2024-10-11},
journal = {SIAM Journal on Scientific Computing},
author = {Parks, Michael L. and De Sturler, Eric and Mackey, Greg and Johnson, Duane D. and Maiti, Spandan},
month = jan,
year = {2006},
pages = {1651--1674},
}
@article{robbe_exact_2006,
title = {Exact and inexact breakdowns in the block {GMRES} method},
volume = {419},
copyright = {https://www.elsevier.com/tdm/userlicense/1.0/},
issn = {00243795},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0024379506002230},
doi = {10.1016/j.laa.2006.04.018},
language = {en},
number = {1},
urldate = {2024-10-11},
journal = {Linear Algebra and its Applications},
author = {Robbé, Mickaël and Sadkane, Miloud},
month = nov,
year = {2006},
pages = {265--285},
}
@unpublished{saigre_coupled_2024_paper,
type = {In preparation},
title = {A coupled fluid-dynamics-heat transfer model for {3D} simulations of the aqueous humor flow in the human eye},
abstract = {Understanding human eye behavior involves intricate interactions between physical phenomena such as heat transfer and fluid dynamics. Accurate computational models are vital for comprehending ocular diseases and therapeutic interventions. This work focuses on modeling and simulating aqueous humor flow in the anterior and posterior chambers of the eye, coupled with overall heat transfer. Aqueous humor dynamics regulates intraocular pressure, which is crucial for understanding conditions like glaucoma. Convective effects from temperature disparities also influence this flow. Extending prior research, this work develops a comprehensive three-dimensional computational model to simulate a coupled fluid-dynamic-heat transfer model, thus contributing to the understanding of ocular physiology.},
author = {Saigre, Thomas and Chabannes, Vincent and Prud'Homme, Christophe and Szopos, Marcela},
}
@inproceedings{jolivet_block_2016,
address = {Salt Lake City, Utah},
series = {{SC} '16},
title = {Block iterative methods and recycling for improved scalability of linear solvers},
isbn = {9781467388153},
abstract = {Contemporary large-scale Partial Differential Equation (PDE) simulations usually require the solution of large and sparse linear systems. Moreover, it is often needed to solve these linear systems with different or multiple Right-Hand Sides (RHSs). In this paper, various strategies will be presented to extend the scalability of existing multigrid or domain decomposition linear solvers using appropriate recycling strategies or block methods---i.e., by treating multiple right-hand sides simultaneously. The scalability of this work is assessed by performing simulations on up to 8,192 cores for solving linear systems arising from various physical phenomena modeled by Poisson's equation, the system of linear elasticity, or Maxwell's equation. This work is shipped as part of an open-source software, readily available and usable in any C/C++, Python, or Fortran code. In particular, some simulations are performed on top of a well-established library, PETSc, and it is shown how our approaches can be used to decrease time to solution down by 30\%.},
urldate = {2024-10-10},
booktitle = {Proceedings of the {International} {Conference} for {High} {Performance} {Computing}, {Networking}, {Storage} and {Analysis}},
publisher = {IEEE Press},
author = {Jolivet, Pierre and Tournier, Pierre-Henri},
month = nov,
year = {2016},
pages = {1--14},
}
@inproceedings{jolivet_scalable_2013,
address = {Denver Colorado},
title = {Scalable domain decomposition preconditioners for heterogeneous elliptic problems},
isbn = {9781450323789},
url = {https://dl.acm.org/doi/10.1145/2503210.2503212},
doi = {10.1145/2503210.2503212},
language = {en},
urldate = {2024-10-10},
booktitle = {Proceedings of the {International} {Conference} on {High} {Performance} {Computing}, {Networking}, {Storage} and {Analysis}},
publisher = {ACM},
author = {Jolivet, Pierre and Hecht, Frédéric and Nataf, Frédéric and Prud'homme, Christophe},
month = nov,
year = {2013},
pages = {1--11},
}
@article{jolivet_ksphpddm_2021,
title = {{KSPHPDDM} and {PCHPDDM}: {Extending} {PETSc} with advanced {Krylov} methods and robust multilevel overlapping {Schwarz} preconditioners},
volume = {84},
issn = {08981221},
shorttitle = {{KSPHPDDM} and {PCHPDDM}},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0898122121000055},
doi = {10.1016/j.camwa.2021.01.003},
language = {en},
urldate = {2024-10-10},
journal = {Computers \& Mathematics with Applications},
author = {Jolivet, Pierre and Roman, Jose E. and Zampini, Stefano},
month = feb,
year = {2021},
pages = {277--295},
}
@article{al_daas_multilevel_2021,
title = {A {Multilevel} {Schwarz} {Preconditioner} {Based} on a {Hierarchy} of {Robust} {Coarse} {Spaces}},
volume = {43},
issn = {1064-8275, 1095-7197},
url = {https://epubs.siam.org/doi/10.1137/19M1266964},
doi = {10.1137/19M1266964},
language = {en},
number = {3},
urldate = {2024-10-10},
journal = {SIAM Journal on Scientific Computing},
author = {Al Daas, Hussam and Grigori, Laura and Jolivet, Pierre and Tournier, Pierre-Henri},
month = jan,
year = {2021},
pages = {A1907--A1928},
}
@book{bernardi_mathematics_2024,
address = {Philadelphia, PA},
title = {Mathematics and {Finite} {Element} {Discretizations} of {Incompressible} {Navier}–{Stokes} {Flows}},
isbn = {9781611978117 9781611978124},
url = {https://epubs.siam.org/doi/book/10.1137/1.9781611978124},
language = {en},
urldate = {2024-10-09},
publisher = {Society for Industrial and Applied Mathematics},
author = {Bernardi, Christine and Girault, Vivette and Hecht, Frédéric and Raviart, Pierre-Arnaud and Rivière, Beatrice},
month = jan,
year = {2024},
doi = {10.1137/1.9781611978124},
}
@article{dapogny_geometrical_2018,
title = {Geometrical shape optimization in fluid mechanics using {FreeFem}++},
volume = {58},
issn = {1615-147X, 1615-1488},
url = {http://link.springer.com/10.1007/s00158-018-2023-2},
doi = {10.1007/s00158-018-2023-2},
language = {en},
number = {6},
urldate = {2024-10-09},
journal = {Structural and Multidisciplinary Optimization},
author = {Dapogny, Charles and Frey, Pascal and Omnès, Florian and Privat, Yannick},
month = dec,
year = {2018},
pages = {2761--2788},
}
@article{zhu_89-line_2021,
title = {An 89-line code for geometrically nonlinear topology optimization written in {FreeFEM}},
volume = {63},
issn = {1615-147X, 1615-1488},
url = {https://link.springer.com/10.1007/s00158-020-02733-x},
doi = {10.1007/s00158-020-02733-x},
language = {en},
number = {2},
urldate = {2024-10-09},
journal = {Structural and Multidisciplinary Optimization},
author = {Zhu, Benliang and Zhang, Xianmin and Li, Hai and Liang, Junwen and Wang, Rixin and Li, Hao and Nishiwaki, Shinji},
month = feb,
year = {2021},
pages = {1015--1027},
}
@article{sadaka_finite_2024,
title = {A finite element toolbox for the {Bogoliubov}-de {Gennes} stability analysis of {Bose}-{Einstein} condensates},
volume = {294},
issn = {00104655},
url = {https://linkinghub.elsevier.com/retrieve/pii/S001046552300293X},
doi = {10.1016/j.cpc.2023.108948},
language = {en},
urldate = {2024-10-09},
journal = {Computer Physics Communications},
author = {Sadaka, Georges and Kalt, Victor and Danaila, Ionut and Hecht, Frédéric},
month = jan,
year = {2024},
pages = {108948},
}
@article{golse_radiative_2023,
title = {Radiative transfer for variable three-dimensional atmospheres},
volume = {475},
issn = {00219991},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0021999122009275},
doi = {10.1016/j.jcp.2022.111864},
language = {en},
urldate = {2024-10-09},
journal = {Journal of Computational Physics},
author = {Golse, F. and Hecht, F. and Pironneau, O. and Smets, D. and Tournier, P.-H.},
month = feb,
year = {2023},
pages = {111864},
}
@article{li_three-dimensional_2022,
title = {Three-dimensional topology optimization of a fluid–structure system using body-fitted mesh adaption based on the level-set method},
volume = {101},
issn = {0307904X},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0307904X21003966},
doi = {10.1016/j.apm.2021.08.021},
language = {en},
urldate = {2024-10-09},
journal = {Applied Mathematical Modelling},
author = {Li, Hao and Kondoh, Tsuguo and Jolivet, Pierre and Furuta, Kozo and Yamada, Takayuki and Zhu, Benliang and Izui, Kazuhiro and Nishiwaki, Shinji},
month = jan,
year = {2022},
pages = {276--308},
}
@article{nataf_geneo_2024,
title = {A {GenEO} {Domain} {Decomposition} method for {Saddle} {Point} problems},
volume = {351},
issn = {1873-7234},
url = {https://comptes-rendus.academie-sciences.fr/mecanique/articles/10.5802/crmeca.175/},
doi = {10.5802/crmeca.175},
language = {en},
number = {S1},
urldate = {2024-10-09},
journal = {Comptes Rendus. Mécanique},
author = {Nataf, Frédéric and Tournier, Pierre-Henri},
month = apr,
year = {2024},
pages = {667--684},
}
@article{tournier_three-dimensional_2022,
title = {Three-dimensional finite-difference finite-element frequency-domain wave simulation with multi-level optimized additive {Schwarz} domain-decomposition preconditioner: {A} tool for {FWI} of sparse node datasets},
issn = {0016-8033, 1942-2156},
shorttitle = {Three-dimensional finite-difference finite-element frequency-domain wave simulation with multi-level optimized additive {Schwarz} domain-decomposition preconditioner},
url = {https://library.seg.org/doi/10.1190/geo2021-0702.1},
doi = {10.1190/geo2021-0702.1},
abstract = {Efficient frequency-domain full-waveform inversion (FWI) of long-offset node data can be designed with a few discrete frequencies, which lead to modest data volumes to be managed during the inversion process. Moreover, attenuation effects can be straightforwardly implemented in the forward problem without the computational overhead. However, 3D frequency-domain seismic modeling is challenging because it requires solving a large and sparse linear indefinite system for each frequency with multiple right-hand sides (RHSs). This linear system can be solved by direct or iterative methods. The former allows efficient processing of multiple RHSs but may suffer from limited scalability for very large problems. Iterative methods equipped with a domain-decomposition preconditioner provide a suitable alternative to process large computational domains for sparse-node acquisition. We have investigated the domain-decomposition preconditioner based on the optimized restricted additive Schwarz (ORAS) method, in which a Robin or perfectly matched layer condition is implemented at the boundaries between the subdomains. The preconditioned system is solved by a Krylov subspace method, whereas a block low-rank lower-upper decomposition of the local matrices is performed at a preprocessing stage. Multiple sources are processed in groups with a pseudoblock method. The accuracy, the computational cost, and the scalability of the ORAS solver are assessed against several realistic benchmarks. In terms of discretization, we compare a compact wavelength-adaptive 27-point finite-difference stencil on a regular Cartesian grid with a P3
finite-element method on h-adaptive tetrahedral mesh. Although both schemes have comparable accuracy, the former is more computationally efficient, the latter being beneficial to comply with known boundaries such as bathymetry. The scalability of the method, the block processing of multiple RHSs, and the straightforward implementation of attenuation, which further improves the convergence of the iterative solver, make the method a versatile forward engine for large-scale 3D FWI applications from sparse node data sets.},
language = {en},
urldate = {2024-10-09},
journal = {GEOPHYSICS},
author = {Tournier, Pierre-Henri and Jolivet, Pierre and Dolean, Victorita and Aghamiry, Hossein S. and Operto, Stéphane and Riffo, Sebastian},
month = jul,
year = {2022},
pages = {1--84},
}
@article{tournier_numerical_2017,
title = {Numerical {Modeling} and {High}-{Speed} {Parallel} {Computing}: {New} {Perspectives} on {Tomographic} {Microwave} {Imaging} for {Brain} {Stroke} {Detection} and {Monitoring}},
volume = {59},
issn = {1558-4143},
shorttitle = {Numerical {Modeling} and {High}-{Speed} {Parallel} {Computing}},
url = {https://ieeexplore.ieee.org/abstract/document/8014422},
doi = {10.1109/MAP.2017.2731199},
abstract = {This article deals with microwave tomography for brain stroke imaging using state-of-the-art numerical modeling and massively parallel computing. Iterative microwave tomographic imaging requires the solution of an inverse problem based on a minimization algorithm (e.g., gradient based) with successive solutions of a direct problem such as the accurate modeling of a whole-microwave measurement system. Moreover, a sufficiently high number of unknowns is required to accurately represent the solution. As the system will be used for detecting a brain stroke (ischemic or hemorrhagic) as well as for monitoring during the treatment, the running times for the reconstructions should be reasonable. The method used is based on high-order finite elements, parallel preconditioners from the domain decomposition method and domain-specific language with the opensource FreeFEM++ solver.},
number = {5},
urldate = {2024-10-09},
journal = {IEEE Antennas and Propagation Magazine},
author = {Tournier, Pierre-Henri and Bonazzoli, Marcella and Dolean, Victorita and Rapetti, Francesca and Hecht, Frederic and Nataf, Frederic and Aliferis, Iannis and El Kanfoud, Ibtissam and Migliaccio, Claire and de Buhan, Maya and Darbas, Marion and Semenov, Serguei and Pichot, Christian},
month = oct,
year = {2017},
keywords = {Antenna measurements, Boundary conditions, Brain modeling, Computational modeling, Finite element analysis, Tomography},
pages = {98--110},
}
@article{sadaka_parallel_2020,
title = {Parallel finite-element codes for the simulation of two-dimensional and three-dimensional solid–liquid phase-change systems with natural convection},
volume = {257},
issn = {00104655},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0010465520302319},
doi = {10.1016/j.cpc.2020.107492},
language = {en},
urldate = {2024-10-09},
journal = {Computer Physics Communications},
author = {Sadaka, Georges and Rakotondrandisa, Aina and Tournier, Pierre-Henri and Luddens, Francky and Lothodé, Corentin and Danaila, Ionut},
month = dec,
year = {2020},
pages = {107492},
}
@book{dolean_introduction_2015,
address = {Philadelphia, PA},
title = {An {Introduction} to {Domain} {Decomposition} {Methods}: {Algorithms}, {Theory}, and {Parallel} {Implementation}},
isbn = {9781611974058 9781611974065},
shorttitle = {An {Introduction} to {Domain} {Decomposition} {Methods}},
url = {http://epubs.siam.org/doi/book/10.1137/1.9781611974065},
language = {en},
urldate = {2024-10-09},
publisher = {Society for Industrial and Applied Mathematics},
author = {Dolean, Victorita and Jolivet, Pierre and Nataf, Frédéric},
month = nov,
year = {2015},
doi = {10.1137/1.9781611974065},
}
@book{hecht_pde-constrained_2024,
title = {{PDE}-constrained optimization within {FreeFEM}},
url = {https://hal.science/hal-04724788},
abstract = {This book is aimed at students and researchers who want to learn how to efficiently solve constrained optimization problems involving partial differential equations (PDE) using the FreeFEM software.},
urldate = {2024-10-09},
author = {Hecht, Frédéric and Lance, Gontran and Trélat, Emmanuel},
year = {2024},
}
@inproceedings{saigre_coupled_2024_abstract,
address = {Arlington (Virginia), United States},
title = {A coupled fluid-dynamics-heat transfer model for {3D} simulations of the aqueous humor flow in the human eye},
url = {https://hal.science/hal-04558924},
booktitle = {{CMBE24}},
author = {Saigre, Thomas and Prud'Homme, Christophe and Szopos, Marcela and Chabannes, Vincent},
month = jun,
year = {2024},
keywords = {thermo-fluid dynamics, finite element method, mathematical and computational ophthalmology},
}
@article{giraud_block_2022,
title = {A {Block} {Minimum} {Residual} {Norm} {Subspace} {Solver} with {Partial} {Convergence} {Management} for {Sequences} of {Linear} {Systems}},
volume = {43},
issn = {0895-4798, 1095-7162},
url = {https://epubs.siam.org/doi/10.1137/21M1401127},
doi = {10.1137/21M1401127},
language = {en},
number = {2},
urldate = {2024-10-09},
journal = {SIAM Journal on Matrix Analysis and Applications},
author = {Giraud, Luc and Jing, Yan-Fei and Xiang, Yanfei},
month = jun,
year = {2022},
pages = {710--739},
}
@article{agullo_robust_2019,
title = {Robust {Preconditioners} via {Generalized} {Eigenproblems} for {Hybrid} {Sparse} {Linear} {Solvers}},
volume = {40},
issn = {0895-4798, 1095-7162},
url = {https://epubs.siam.org/doi/10.1137/17M1153765},
doi = {10.1137/17M1153765},
language = {en},
number = {2},
urldate = {2024-10-09},
journal = {SIAM Journal on Matrix Analysis and Applications},
author = {Agullo, Emmanuel and Giraud, Luc and Poirel, Louis},
month = jan,
year = {2019},
pages = {417--439},
}
@article{agullo_resiliency_2022,
title = {Resiliency in numerical algorithm design for extreme scale simulations},
volume = {36},
issn = {1094-3420, 1741-2846},
url = {https://journals.sagepub.com/doi/10.1177/10943420211055188},
doi = {10.1177/10943420211055188},
abstract = {This work is based on the seminar titled ‘Resiliency in Numerical Algorithm Design for Extreme Scale Simulations’ held March 1–6, 2020, at Schloss Dagstuhl, that was attended by all the authors. Advanced supercomputing is characterized by very high computation speeds at the cost of involving an enormous amount of resources and costs. A typical large-scale computation running for 48 h on a system consuming 20 MW, as predicted for exascale systems, would consume a million kWh, corresponding to about 100k Euro in energy cost for executing $10^{23}$
floating-point operations. It is clearly unacceptable to lose the whole computation if any of the several million parallel processes fails during the execution. Moreover, if a single operation suffers from a bit-flip error, should the whole computation be declared invalid? What about the notion of reproducibility itself: should this core paradigm of science be revised and refined for results that are obtained by large-scale simulation? Naive versions of conventional resilience techniques will not scale to the exascale regime: with a main memory footprint of tens of Petabytes, synchronously writing checkpoint data all the way to background storage at frequent intervals will create intolerable overheads in runtime and energy consumption. Forecasts show that the mean time between failures could be lower than the time to recover from such a checkpoint, so that large calculations at scale might not make any progress if robust alternatives are not investigated. More advanced resilience techniques must be devised. The key may lie in exploiting both advanced system features as well as specific application knowledge. Research will face two essential questions: (1) what are the reliability requirements for a particular computation and (2) how do we best design the algorithms and software to meet these requirements? While the analysis of use cases can help understand the particular reliability requirements, the construction of remedies is currently wide open. One avenue would be to refine and improve on system- or application-level checkpointing and rollback strategies in the case an error is detected. Developers might use fault notification interfaces and flexible runtime systems to respond to node failures in an application-dependent fashion. Novel numerical algorithms or more stochastic computational approaches may be required to meet accuracy requirements in the face of undetectable soft errors. These ideas constituted an essential topic of the seminar. The goal of this Dagstuhl Seminar was to bring together a diverse group of scientists with expertise in exascale computing to discuss novel ways to make applications resilient against detected and undetected faults. In particular, participants explored the role that algorithms and applications play in the holistic approach needed to tackle this challenge. This article gathers a broad range of perspectives on the role of algorithms, applications and systems in achieving resilience for extreme scale simulations. The ultimate goal is to spark novel ideas and encourage the development of concrete solutions for achieving such resilience holistically.},
language = {en},
number = {2},
urldate = {2024-10-09},
journal = {The International Journal of High Performance Computing Applications},
author = {Agullo, Emmanuel and Altenbernd, Mirco and Anzt, Hartwig and Bautista-Gomez, Leonardo and Benacchio, Tommaso and Bonaventura, Luca and Bungartz, Hans-Joachim and Chatterjee, Sanjay and Ciorba, Florina M and DeBardeleben, Nathan and Drzisga, Daniel and Eibl, Sebastian and Engelmann, Christian and Gansterer, Wilfried N and Giraud, Luc and Göddeke, Dominik and Heisig, Marco and Jézéquel, Fabienne and Kohl, Nils and Li, Xiaoye Sherry and Lion, Romain and Mehl, Miriam and Mycek, Paul and Obersteiner, Michael and Quintana-Ortí, Enrique S and Rizzi, Francesco and Rüde, Ulrich and Schulz, Martin and Fung, Fred and Speck, Robert and Stals, Linda and Teranishi, Keita and Thibault, Samuel and Thönnes, Dominik and Wagner, Andreas and Wohlmuth, Barbara},
month = mar,
year = {2022},
pages = {251--285},
}
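@comment{Rough check of the energy figure quoted in the Agullo et al. (2022) abstract above, assuming an electricity price of about 0.10 Euro per kWh (an assumption; the abstract does not state a price): $20\,\mathrm{MW} \times 48\,\mathrm{h} = 960{,}000\,\mathrm{kWh} \approx 10^{6}\,\mathrm{kWh}$, and $10^{6}\,\mathrm{kWh} \times 0.10\,\mathrm{Euro/kWh} \approx 10^{5}\,\mathrm{Euro}$, consistent with the cited 100k Euro for roughly $10^{23}$ floating-point operations at exascale rates.}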
@article{agullo_soft_2020,
title = {On {Soft} {Errors} in the {Conjugate} {Gradient} {Method}: {Sensitivity} and {Robust} {Numerical} {Detection}},
volume = {42},
issn = {1064-8275, 1095-7197},
shorttitle = {On {Soft} {Errors} in the {Conjugate} {Gradient} {Method}},
url = {https://epubs.siam.org/doi/10.1137/18M122858X},
doi = {10.1137/18M122858X},
language = {en},
number = {6},
urldate = {2024-10-09},
journal = {SIAM Journal on Scientific Computing},
author = {Agullo, Emmanuel and Cools, Siegfried and Yetkin, Emrullah Fatih and Giraud, Luc and Schenkels, Nick and Vanroose, Wim},
month = jan,
year = {2020},
pages = {C335--C358},
}
@article{pham_assembling_2024,
title = {Assembling algorithm for {Green}'s tensors and absorbing boundary conditions for {Galbrun}'s equation in radial symmetry},
volume = {519},
issn = {0021-9991},
url = {https://www.sciencedirect.com/science/article/pii/S0021999124006922},
doi = {10.1016/j.jcp.2024.113444},
abstract = {Solar oscillations can be modeled by Galbrun's equation which describes Lagrangian wave displacement in a self-gravitating stratified medium. For spherically symmetric backgrounds, we construct an algorithm to compute efficiently and accurately the coefficients of the Green's tensor of the time-harmonic equation in vector spherical harmonic basis. With only two resolutions, our algorithm provides values of the kernels for all heights of source and receiver, and prescribes analytically the singularities of the kernels. We also derive absorbing boundary conditions (ABC) to model wave propagation in the atmosphere above the cut-off frequency. The construction of ABC, which contains varying gravity terms, is rendered difficult by the complex behavior of the solar potential in low atmosphere and for frequencies below the Lamb frequency. We carry out extensive numerical investigations to compare and evaluate the efficiency of the ABCs in capturing outgoing solutions. Finally, as an application towards helioseismology, we compute synthetic solar power spectra that contain pressure modes as well as internal-gravity (g-) and surface-gravity (f-) ridges which are missing in simpler approximations of the wave equation. For purpose of validation, the locations of the ridges in the synthetic power spectra are compared with observed solar modes.},
urldate = {2024-10-09},
journal = {Journal of Computational Physics},
author = {Pham, Ha and Faucher, Florian and Fournier, Damien and Barucq, Hélène and Gizon, Laurent},
month = dec,
year = {2024},
pages = {113444},
}
@book{elman_finite_2014,
address = {Oxford},
edition = {2nd},
series = {Numerical mathematics and scientific computation},
title = {Finite elements and fast iterative solvers: with applications in incompressible fluid dynamics},
isbn = {978-0-19-967879-2},
shorttitle = {Finite elements and fast iterative solvers},
language = {eng},
publisher = {Oxford University Press},
author = {Elman, Howard C. and Silvester, David J. and Wathen, Andrew J.},
year = {2014},
}
@article{prudhomme_reliable_2002,
title = {Reliable {Real}-{Time} {Solution} of {Parametrized} {Partial} {Differential} {Equations}: {Reduced}-{Basis} {Output} {Bound} {Methods}},
volume = {124},
issn = {0098-2202, 1528-901X},
shorttitle = {Reliable {Real}-{Time} {Solution} of {Parametrized} {Partial} {Differential} {Equations}},
url = {https://asmedigitalcollection.asme.org/fluidsengineering/article/124/1/70/462808/Reliable-RealTime-Solution-of-Parametrized-Partial},
doi = {10.1115/1.1448332},
abstract = {We present a technique for the rapid and reliable prediction of linear-functional outputs of elliptic (and parabolic) partial differential equations with affine parameter dependence. The essential components are (i) (provably) rapidly convergent global reduced-basis approximations—Galerkin projection onto a space WN spanned by solutions of the governing partial differential equation at N selected points in parameter space; (ii) a posteriori error estimation—relaxations of the error-residual equation that provide inexpensive yet sharp and rigorous bounds for the error in the outputs of interest; and (iii) off-line/on-line computational procedures methods which decouple the generation and projection stages of the approximation process. The operation count for the on-line stage in which, given a new parameter value, we calculate the output of interest and associated error bound, depends only on N (typically very small) and the parametric complexity of the problem; the method is thus ideally suited for the repeated and rapid evaluations required in the context of parameter estimation, design, optimization, and real-time control.},
language = {en},
number = {1},
journal = {Journal of Fluids Engineering},
author = {Prud’homme, C. and Rovas, D. V. and Veroy, K. and Machiels, L. and Maday, Y. and Patera, A. T. and Turinici, G.},
month = mar,
year = {2002},
pages = {70--80},
}
@article{Virieux2009,
title = {An overview of full-waveform inversion in exploration geophysics},
volume = {74},
doi = {10.1190/1.3238367},
number = {6},
journal = {Geophysics},
author = {Virieux, Jean and Operto, Stéphane},
year = {2009},
note = {Publisher: Society of Exploration Geophysicists},
pages = {WCC1--WCC26},
}
@article{Pham2020Siam,
title = {Efficient and accurate algorithm for the full modal {Green}'s kernel of the scalar wave equation in helioseismology},
volume = {80},
doi = {10.1137/20M1336709},
number = {6},
journal = {SIAM Journal on Applied Mathematics},
author = {Barucq, Hélène and Faucher, Florian and Fournier, Damien and Gizon, Laurent and Pham, Ha},
year = {2020},
pages = {2657--2683},
}
@article{Pham2019radiationBC,
title = {Outgoing solutions and radiation boundary conditions for the ideal atmospheric scalar wave equation in helioseismology},
volume = {54},
doi = {10.1051/m2an/2019088},
number = {4},
journal = {ESAIM: Mathematical Modelling and Numerical Analysis},
author = {Barucq, Hélène and Faucher, Florian and Pham, Ha},
year = {2020},
pages = {1111--1138},
}
@article{Liu2024,
title = {{WaveBench}: {Benchmarking} data-driven solvers for linear wave propagation {PDEs}},
issn = {2835-8856},
url = {https://openreview.net/forum?id=6wpInwnzs8},
journal = {Transactions on Machine Learning Research},
author = {Liu, Tianlin and Benitez, Jose Antonio Lara and Faucher, Florian and Khorashadizadeh, AmirEhsan and de Hoop, Maarten V. and Dokmanić, Ivan},
year = {2024},
}
@article{Benitez2024,
title = {Out-of-distributional risk bounds for neural operators with applications to the {Helmholtz} equation},
doi = {10.1016/j.jcp.2024.113168},
journal = {Journal of Computational Physics},
author = {Benitez, Jose Antonio Lara and Furuya, Takashi and Faucher, Florian and Kratsios, Anastasis and Tricoche, Xavier and de Hoop, Maarten V},
year = {2024},
note = {Publisher: Elsevier},
pages = {113168},
}
@article{Faucher2023viscoacoustic,
title = {Quantitative inverse problem in visco-acoustic media under attenuation model uncertainty},
volume = {472},
doi = {10.1016/j.jcp.2022.111685},
journal = {Journal of Computational Physics},
author = {Faucher, Florian and Scherzer, Otmar},
year = {2023},
note = {Publisher: Elsevier},
pages = {111685},
}
@article{Faucher2020DAS,
title = {Reciprocity-gap misfit functional for {Distributed} {Acoustic} {Sensing}, combining data from passive and active sources},
volume = {86},
issn = {0016-8033},
doi = {10.1190/geo2020-0305.1},
number = {2},
journal = {Geophysics},
author = {Faucher, Florian and De Hoop, Maarten V and Scherzer, Otmar},
year = {2020},
pages = {1--46},
}
@article{Faucher2020adjoint,
title = {Adjoint-state method for {Hybridizable} {Discontinuous} {Galerkin} discretization, application to the inverse acoustic wave problem},
volume = {372},
issn = {0045-7825},
doi = {10.1016/j.cma.2020.113406},
journal = {Computer Methods in Applied Mechanics and Engineering},
author = {Faucher, Florian and Scherzer, Otmar},
year = {2020},
pages = {113406},
}
@article{Faucher2019FRgWIGeo,
title = {Full {Reciprocity}-{Gap} {Waveform} {Inversion}, enabling sparse-source acquisition},
volume = {85},
doi = {10.1190/geo2019-0527.1},
number = {6},
journal = {Geophysics},
author = {Faucher, Florian and Alessandrini, Giovanni and Barucq, Hélène and de Hoop, Maarten and Gaburro, Romina and Sincich, Eva},
year = {2020},
note = {Publisher: Society of Exploration Geophysicists},
pages = {R461--R476},
}
@article{bonazzoli_domain_2019,
title = {Domain decomposition preconditioning for the high-frequency time-harmonic {Maxwell} equations with absorption},
volume = {88},
copyright = {https://www.ams.org/publications/copyright-and-permissions},
issn = {0025-5718, 1088-6842},
url = {https://www.ams.org/mcom/2019-88-320/S0025-5718-2019-03447-6/},
doi = {10.1090/mcom/3447},
language = {en},
number = {320},
urldate = {2024-10-08},
journal = {Mathematics of Computation},
author = {Bonazzoli, M. and Dolean, V. and Graham, I. G. and Spence, E. A. and Tournier, P.-H.},
month = may,
year = {2019},
pages = {2559--2604},
}
@article{noauthor_benchmarking_nodate,
title = {Benchmarking analysis report},
language = {en},
}
@book{asch_data_2016,
address = {Philadelphia, PA},
title = {Data assimilation},
url = {https://epubs.siam.org/doi/abs/10.1137/1.9781611974546},
publisher = {Society for Industrial and Applied Mathematics},
author = {Asch, Mark and Bocquet, Marc and Nodet, Maëlle},
year = {2016},
doi = {10.1137/1.9781611974546},
note = {eprint: https://epubs.siam.org/doi/pdf/10.1137/1.9781611974546},
}
@article{CRMATH_2009__347_7-8_435_0,
title = {Une méthode combinée d'éléments finis à deux grilles/bases réduites pour l'approximation des solutions d'une {E}.{D}.{P}. paramétrique},
volume = {347},
url = {http://www.numdam.org/articles/10.1016/j.crma.2009.02.019/},
doi = {10.1016/j.crma.2009.02.019},
language = {fr},
number = {7-8},
journal = {Comptes Rendus. Mathématique},
author = {Chakir, Rachida and Maday, Yvon},
year = {2009},
note = {Publisher: Elsevier},
pages = {435--440},
}
@article{noauthor_notitle_nodate,