@article{33684,
  author       = {{Schade, Robert and Kenter, Tobias and Elgabarty, Hossam and Lass, Michael and Schütt, Ole and Lazzaro, Alfio and Pabst, Hans and Mohr, Stephan and Hutter, Jürg and Kühne, Thomas and Plessl, Christian}},
  issn         = {{0167-8191}},
  journal      = {{Parallel Computing}},
  keywords     = {{Artificial Intelligence, Computer Graphics and Computer-Aided Design, Computer Networks and Communications, Hardware and Architecture, Theoretical Computer Science, Software}},
  publisher    = {{Elsevier BV}},
  title        = {{{Towards electronic structure-based ab-initio molecular dynamics simulations with hundreds of millions of atoms}}},
  doi          = {{10.1016/j.parco.2022.102920}},
  volume       = {{111}},
  year         = {{2022}},
}

@article{27364,
  author       = {{Meyer, Marius and Kenter, Tobias and Plessl, Christian}},
  issn         = {{0743-7315}},
  journal      = {{Journal of Parallel and Distributed Computing}},
  title        = {{{In-depth FPGA Accelerator Performance Evaluation with Single Node Benchmarks from the HPC Challenge Benchmark Suite for Intel and Xilinx FPGAs using OpenCL}}},
  doi          = {{10.1016/j.jpdc.2021.10.007}},
  year         = {{2022}},
}

@article{44088,
  abstract     = {{Hole polarons and defect-bound exciton polarons in lithium niobate are investigated by means of density-functional theory, where the localization of the holes is achieved by applying the +U approach to the oxygen 2p orbitals. We find three principal configurations of hole polarons: (i) self-trapped holes localized at displaced regular oxygen atoms and (ii) two other configurations bound to a lithium vacancy either at a threefold coordinated oxygen atom above or at a two-fold coordinated oxygen atom below the defect. The latter is the most stable and is in excellent quantitative agreement with measured g factors from electron paramagnetic resonance. Due to the absence of mid-gap states, none of these hole polarons can explain the broad optical absorption centered between 2.5 and 2.8 eV that is observed in transient absorption spectroscopy, but such states appear if a free electron polaron is trapped at the same lithium vacancy as the bound hole polaron, resulting in an exciton polaron. The dielectric function calculated by solving the Bethe–Salpeter equation indeed yields an optical peak at 2.6 eV in agreement with the two-photon experiments. The coexistence of hole and exciton polarons, which are simultaneously created in optical excitations, thus satisfactorily explains the reported experimental data.}},
  author       = {{Schmidt, Falko and Kozub, Agnieszka L. and Gerstmann, Uwe and Schmidt, Wolf Gero and Schindlmayr, Arno}},
  issn         = {{2073-4352}},
  journal      = {{Crystals}},
  number       = {{11}},
  publisher    = {{MDPI AG}},
  title        = {{{A density-functional theory study of hole and defect-bound exciton polarons in lithium niobate}}},
  doi          = {{10.3390/cryst12111586}},
  volume       = {{12}},
  year         = {{2022}},
}

@article{40371,
  abstract     = {{<jats:p>Multimode integrated interferometers have great potential for both spectral engineering and metrological applications. However, the material dispersion of integrated platforms constitutes an obstacle that limits the performance and precision of such interferometers. At the same time, two-colour nonlinear interferometers present an important tool for metrological applications, when measurements in a certain frequency range are difficult. In this manuscript, we theoretically developed and investigated an integrated multimode two-colour SU(1,1) interferometer operating in a supersensitive mode. By ensuring the proper design of the integrated platform, we suppressed the dispersion, thereby significantly increasing the visibility of the interference pattern. The use of a continuous wave pump laser provided the symmetry between the spectral shapes of the signal and idler photons concerning half the pump frequency, despite different photon colours. We demonstrate that such an interferometer overcomes the classical phase sensitivity limit for wide parametric gain ranges, when up to 3×104 photons are generated.</jats:p>}},
  author       = {{Ferreri, Alessandro and Sharapova, Polina R.}},
  issn         = {{2073-8994}},
  journal      = {{Symmetry}},
  keywords     = {{Physics and Astronomy (miscellaneous), General Mathematics, Chemistry (miscellaneous), Computer Science (miscellaneous)}},
  number       = {{3}},
  publisher    = {{MDPI AG}},
  title        = {{{Two-Colour Spectrally Multimode Integrated SU(1,1) Interferometer}}},
  doi          = {{10.3390/sym14030552}},
  volume       = {{14}},
  year         = {{2022}},
}

@article{28099,
  abstract     = {{N-body methods are one of the essential algorithmic building blocks of high-performance and parallel computing. Previous research has shown promising performance for implementing n-body simulations with pairwise force calculations on FPGAs. However, to avoid challenges with accumulation and memory access patterns, the presented designs calculate each pair of forces twice, along with both force sums of the involved particles. Also, they require large problem instances with hundreds of thousands of particles to reach their respective peak performance, limiting the applicability for strong scaling scenarios. This work addresses both issues by presenting a novel FPGA design that uses each calculated force twice and overlaps data transfers and computations in a way that allows to reach peak performance even for small problem instances, outperforming previous single precision results even in double precision, and scaling linearly over multiple interconnected FPGAs. For a comparison across architectures, we provide an equally optimized CPU reference, which for large problems actually achieves higher peak performance per device, however, given the strong scaling advantages of the FPGA design, in parallel setups with few thousand particles per device, the FPGA platform achieves highest performance and power efficiency.}},
  author       = {{Menzel, Johannes and Plessl, Christian and Kenter, Tobias}},
  issn         = {{1936-7406}},
  journal      = {{ACM Transactions on Reconfigurable Technology and Systems}},
  number       = {{1}},
  pages        = {{1--30}},
  title        = {{{The Strong Scaling Advantage of FPGAs in HPC for N-body Simulations}}},
  doi          = {{10.1145/3491235}},
  volume       = {{15}},
  year         = {{2021}},
}

@inproceedings{27365,
  author       = {{Meyer, Marius}},
  booktitle    = {{Proceedings of the 11th International Symposium on Highly Efficient Accelerators and Reconfigurable Technologies}},
  title        = {{{Towards Performance Characterization of FPGAs in Context of HPC using OpenCL Benchmarks}}},
  doi          = {{10.1145/3468044.3468058}},
  year         = {{2021}},
}

@inproceedings{20886,
  author       = {{Nickchen, Tobias and Heindorf, Stefan and Engels, Gregor}},
  booktitle    = {{Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision}},
  location     = {{Hawaii}},
  pages        = {{1994--2002}},
  title        = {{{Generating Physically Sound Training Data for Image Recognition of Additively Manufactured Parts}}},
  year         = {{2021}},
}

@article{32243,
  abstract     = {{<jats:title>Abstract</jats:title>
               <jats:p>The defining feature of active particles is that they constantly propel themselves by locally converting chemical energy into directed motion. This active self-propulsion prevents them from equilibrating with their thermal environment (e.g. an aqueous solution), thus keeping them permanently out of equilibrium. Nevertheless, the spatial dynamics of active particles might share certain equilibrium features, in particular in the steady state. We here focus on the time-reversal symmetry of individual spatial trajectories as a distinct equilibrium characteristic. We investigate to what extent the steady-state trajectories of a trapped active particle obey or break this time-reversal symmetry. Within the framework of active Ornstein–Uhlenbeck particles we find that the steady-state trajectories in a harmonic potential fulfill path-wise time-reversal symmetry exactly, while this symmetry is typically broken in anharmonic potentials.</jats:p>}},
  author       = {{Dabelow, Lennart and Bo, Stefano and Eichhorn, Ralf}},
  issn         = {{1742-5468}},
  journal      = {{Journal of Statistical Mechanics: Theory and Experiment}},
  keywords     = {{Statistics, Probability and Uncertainty, Statistics and Probability, Statistical and Nonlinear Physics}},
  number       = {{3}},
  publisher    = {{IOP Publishing}},
  title        = {{{How irreversible are steady-state trajectories of a trapped active particle?}}},
  doi          = {{10.1088/1742-5468/abe6fd}},
  volume       = {{2021}},
  year         = {{2021}},
}

@unpublished{32244,
  abstract     = {{We push the boundaries of electronic structure-based \textit{ab-initio}
molecular dynamics (AIMD) beyond 100 million atoms. This scale is otherwise
barely reachable with classical force-field methods or novel neural network and
machine learning potentials. We achieve this breakthrough by combining
innovations in linear-scaling AIMD, efficient and approximate sparse linear
algebra, low and mixed-precision floating-point computation on GPUs, and a
compensation scheme for the errors introduced by numerical approximations. The
core of our work is the non-orthogonalized local submatrix method (NOLSM),
which scales very favorably to massively parallel computing systems and
translates large sparse matrix operations into highly parallel, dense matrix
operations that are ideally suited to hardware accelerators. We demonstrate
that the NOLSM method, which is at the center point of each AIMD step, is able
to achieve a sustained performance of 324 PFLOP/s in mixed FP16/FP32 precision
corresponding to an efficiency of 67.7% when running on 1536 NVIDIA A100 GPUs.}},
  author       = {{Schade, Robert and Kenter, Tobias and Elgabarty, Hossam and Lass, Michael and Schütt, Ole and Lazzaro, Alfio and Pabst, Hans and Mohr, Stephan and Hutter, Jürg and Kühne, Thomas D. and Plessl, Christian}},
  booktitle    = {{arXiv:2104.08245}},
  title        = {{{Towards Electronic Structure-Based Ab-Initio Molecular Dynamics  Simulations with Hundreds of Millions of Atoms}}},
  year         = {{2021}},
}

@inproceedings{29937,
  author       = {{Karp, Martin and Podobas, Artur and Jansson, Niclas and Kenter, Tobias and Plessl, Christian and Schlatter, Philipp and Markidis, Stefano}},
  booktitle    = {{2021 IEEE International Parallel and Distributed Processing Symposium (IPDPS)}},
  publisher    = {{IEEE}},
  title        = {{{High-Performance Spectral Element Methods on Field-Programmable Gate Arrays : Implementation, Evaluation, and Future Projection}}},
  doi          = {{10.1109/ipdps49936.2021.00116}},
  year         = {{2021}},
}

@inproceedings{46194,
  author       = {{Kenter, Tobias and Shambhu, Adesh and Faghih-Naini, Sara and Aizinger, Vadym}},
  booktitle    = {{Proceedings of the Platform for Advanced Scientific Computing Conference (PASC)}},
  publisher    = {{ACM}},
  title        = {{{Algorithm-hardware co-design of a discontinuous Galerkin shallow-water model for a dataflow architecture on FPGA}}},
  doi          = {{10.1145/3468267.3470617}},
  year         = {{2021}},
}

@unpublished{32236,
  abstract     = {{The interaction between quantum light and matter is being intensively studied
for systems that are enclosed in high-$Q$ cavities which strongly enhance the
light-matter coupling. However, for many applications, cavities with lower
$Q$-factors are preferred due to the increased spectral width of the cavity
mode. Here, we investigate the interaction between quantum light and matter
represented by a $\Lambda$-type three-level system in lossy cavities, assuming
that cavity losses are the dominant loss mechanism. We demonstrate that cavity
losses lead to non-trivial steady states of the electronic occupations that can
be controlled by the loss rate and the initial statistics of the quantum
fields. The mechanism of formation of such steady states can be understood on
the basis of the equations of motion. Analytical expressions for steady states
and their numerical simulations are presented and discussed.}},
  author       = {{Rose, H. and Tikhonova, O. V. and Meier, T. and Sharapova, P. }},
  booktitle    = {{arXiv:2109.00842}},
  title        = {{{Steady states of $Λ$-type three-level systems excited by quantum  light in lossy cavities}}},
  year         = {{2021}},
}

@article{46122,
  author       = {{Kaczmarek, Olaf and Mazur, Lukas and Sharma, Sayantan}},
  issn         = {{2470-0010}},
  journal      = {{Physical Review D}},
  number       = {{9}},
  publisher    = {{American Physical Society (APS)}},
  title        = {{{Eigenvalue spectra of QCD and the fate of <mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" display="inline"><mml:msub><mml:mi>U</mml:mi><mml:mi>A</mml:mi></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo stretchy="false">)</mml:mo></mml:math> breaking towards the chiral limit}}},
  doi          = {{10.1103/physrevd.104.094518}},
  volume       = {{104}},
  year         = {{2021}},
}

@article{46124,
  author       = {{Altenkort, Luis and Eller, Alexander M. and Kaczmarek, O. and Mazur, Lukas and Moore, Guy D. and Shu, H.-T.}},
  issn         = {{2470-0010}},
  journal      = {{Physical Review D}},
  number       = {{1}},
  publisher    = {{American Physical Society (APS)}},
  title        = {{{Heavy quark momentum diffusion from the lattice using gradient flow}}},
  doi          = {{10.1103/physrevd.103.014511}},
  volume       = {{103}},
  year         = {{2021}},
}

@article{46123,
  author       = {{Altenkort, Luis and Eller, Alexander M. and Kaczmarek, O. and Mazur, Lukas and Moore, Guy D. and Shu, H.-T.}},
  issn         = {{2470-0010}},
  journal      = {{Physical Review D}},
  number       = {{11}},
  publisher    = {{American Physical Society (APS)}},
  title        = {{{Sphaleron rate from Euclidean lattice correlators: An exploration}}},
  doi          = {{10.1103/physrevd.103.114513}},
  volume       = {{103}},
  year         = {{2021}},
}

@inproceedings{46195,
  author       = {{Karp, Martin and Podobas, Artur and Jansson, Niclas and Kenter, Tobias and Plessl, Christian and Schlatter, Philipp and Markidis, Stefano}},
  booktitle    = {{2021 IEEE International Parallel and Distributed Processing Symposium (IPDPS)}},
  publisher    = {{IEEE}},
  title        = {{{High-Performance Spectral Element Methods on Field-Programmable Gate Arrays : Implementation, Evaluation, and Future Projection}}},
  doi          = {{10.1109/ipdps49936.2021.00116}},
  year         = {{2021}},
}

@inbook{21587,
  abstract     = {{Solving partial differential equations on unstructured grids is a cornerstone of engineering and scientific computing. Nowadays, heterogeneous parallel platforms with CPUs, GPUs, and FPGAs enable energy-efficient and computationally demanding simulations. We developed the HighPerMeshes C++-embedded Domain-Specific Language (DSL) for bridging the abstraction gap between the mathematical and algorithmic formulation of mesh-based algorithms for PDE problems on the one hand and an increasing number of heterogeneous platforms with their different parallel programming and runtime models on the other hand. Thus, the HighPerMeshes DSL aims at higher productivity in the code development process for multiple target platforms. We introduce the concepts as well as the basic structure of the HighPerMeshes DSL, and demonstrate its usage with three examples, a Poisson and monodomain problem, respectively, solved by the continuous finite element method, and the discontinuous Galerkin method for Maxwell’s equation. The mapping of the abstract algorithmic description onto parallel hardware, including distributed memory compute clusters, is presented. Finally, the achievable performance and scalability are demonstrated for a typical example problem on a multi-core CPU cluster.}},
  author       = {{Alhaddad, Samer and Förstner, Jens and Groth, Stefan and Grünewald, Daniel and Grynko, Yevgen and Hannig, Frank and Kenter, Tobias and Pfreundt, Franz-Josef and Plessl, Christian and Schotte, Merlind and Steinke, Thomas and Teich, Jürgen and Weiser, Martin and Wende, Florian}},
  booktitle    = {{Euro-Par 2020: Parallel Processing Workshops}},
  isbn         = {{9783030715922}},
  issn         = {{0302-9743}},
  keywords     = {{tet_topic_hpc}},
  title        = {{{HighPerMeshes – A Domain-Specific Language for Numerical Algorithms on Unstructured Grids}}},
  doi          = {{10.1007/978-3-030-71593-9_15}},
  year         = {{2021}},
}

@inbook{29936,
  author       = {{Ramaswami, Arjun and Kenter, Tobias and Kühne, Thomas and Plessl, Christian}},
  booktitle    = {{Applied Reconfigurable Computing. Architectures, Tools, and Applications}},
  isbn         = {{9783030790240}},
  issn         = {{0302-9743}},
  publisher    = {{Springer International Publishing}},
  title        = {{{Evaluating the Design Space for Offloading 3D FFT Calculations to an FPGA for High-Performance Computing}}},
  doi          = {{10.1007/978-3-030-79025-7_21}},
  year         = {{2021}},
}

@article{24788,
  author       = {{Alhaddad, Samer and Förstner, Jens and Groth, Stefan and Grünewald, Daniel and Grynko, Yevgen and Hannig, Frank and Kenter, Tobias and Pfreundt, Franz‐Josef and Plessl, Christian and Schotte, Merlind and Steinke, Thomas and Teich, Jürgen and Weiser, Martin and Wende, Florian}},
  issn         = {{1532-0626}},
  journal      = {{Concurrency and Computation: Practice and Experience}},
  keywords     = {{tet_topic_hpc}},
  pages        = {{e6616}},
  title        = {{{The HighPerMeshes framework for numerical algorithms on unstructured grids}}},
  doi          = {{10.1002/cpe.6616}},
  year         = {{2021}},
}

@article{32240,
  abstract     = {{<p>The effect of traces of ethanol in supercritical carbon dioxide on the mixture's thermodynamic properties is studied by molecular simulations and Taylor dispersion measurements.</p>}},
  author       = {{Chatwell, René Spencer and Guevara-Carrion, Gabriela and Gaponenko, Yuri and Shevtsova, Valentina and Vrabec, Jadran}},
  issn         = {{1463-9076}},
  journal      = {{Physical Chemistry Chemical Physics}},
  keywords     = {{Physical and Theoretical Chemistry, General Physics and Astronomy}},
  number       = {{4}},
  pages        = {{3106--3115}},
  publisher    = {{Royal Society of Chemistry (RSC)}},
  title        = {{{Diffusion of the carbon dioxide–ethanol mixture in the extended critical region}}},
  doi          = {{10.1039/d0cp04985a}},
  volume       = {{23}},
  year         = {{2021}},
}

