% IMPORTANT: The following is UTF-8 encoded. This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.
% Workshop paper by Beckmann and Kabadshow, published in the Springer series
% "Lecture Notes in Computational Science and Engineering", volume 105 (2015).
%
% Field layout: bibliographic fields first, then event details, identifiers,
% the abstract, and finally the record-keeping fields carried over from the
% source repository export (reportid, cin, ddc, cid, pnm, pid, typ, comment).
% Those last fields are not known to the standard styles and are ignored.
%
% The workshop name, place and dates live in eventtitle / venue / eventdate
% (biblatex fields; classic BibTeX styles ignore them). They are kept out of
% `date` on purpose: biblatex treats `date` as the publication date, which
% would contradict `year`.
%
% NOTE(review): `month` is kept from the original export; it coincides with
% the workshop month -- confirm that it is really the publication month.
@inproceedings{Beckmann:280931,
  author     = {Beckmann, Andreas and Kabadshow, Ivo},
  title      = {Portable Node-Level Performance Optimization for the
                {Fast} {Multipole} {Method}},
  booktitle  = {Recent Trends in Computational Engineering - CE2014},
  series     = {Lecture Notes in Computational Science and Engineering},
  volume     = {105},
  pages      = {29--46},
  publisher  = {Springer International Publishing},
  address    = {Cham},
  year       = {2015},
  month      = oct,
  eventtitle = {3rd International Workshop on Computational Engineering},
  venue      = {Stuttgart, Germany},
  eventdate  = {2014-10-06/2014-10-10},
  isbn       = {978-3-319-22996-6},
  doi        = {10.1007/978-3-319-22997-3_2},
  url        = {https://juser.fz-juelich.de/record/280931},
  abstract   = {This article provides an in-depth analysis and high-level
                C++ optimization strategies for the most time-consuming
                kernels of a Fast Multipole Method (FMM). The two main
                kernels of a Coulomb FMM are formulated to support different
                hardware features, such as unrolling, vectorization or
                threading without the need to rewrite the kernels in
                intrinsics or even assembly. The abstract description of the
                algorithm automatically allows optimal node-level peak
                performance on a broad class of available hardware
                platforms. Most of the presented optimization schemes allow
                a generic, hence platform-independent description for other
                kernels as well.},
  reportid   = {FZJ-2016-00642},
  cin        = {JSC},
  ddc        = {510},
  cid        = {I:(DE-Juel1)JSC-20090406},
  pnm        = {511 - Computational Science and Mathematical Methods
                (POF3-511) / GromEx - Highly Scalable Unified Long-Range
                Electrostatics and Flexible Ionization for Realistic
                Biomolecular Simulations on the Exascale (230673686)},
  pid        = {G:(DE-HGF)POF3-511 / G:(GEPRIS)230673686},
  typ        = {PUB:(DE-HGF)8},
  comment    = {Recent Trends in Computational Engineering - CE2014},
}