% IMPORTANT: The following is UTF-8 encoded. This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.
% Training course "GPU Programming Part 1: Foundations", report id FZJ-2024-07560.
% The fields reportid, subtyp, cin, cid, pnm, pid and typ are not standard
% BibTeX fields (presumably repository export metadata -- confirm against the
% record URL); standard styles ignore unknown fields.
@misc{Herten:1034807,
  author       = {Herten, Andreas and Meinke, Jan and Haghighi Mood, Kaveh
                  and Kraus, Jiri and Hrywniak, Markus},
  title        = {{GPU} Programming Part 1: Foundations},
  reportid     = {FZJ-2024-07560},
  year         = {2024},
  abstract     = {GPU-accelerated computing drives current scientific
                  research. Writing fast numeric algorithms for GPUs offers
                  high application performance by offloading compute-intensive
                  portions of the code to a GPU. The course will cover aspects
                  of GPU architectures and programming. Focus is on the usage
                  of the parallel programming language CUDA C++, which allows
                  maximum control of NVIDIA GPU hardware. Examples of
                  increasing complexity are used to demonstrate optimization
                  and tuning of scientific applications. This course is a basic
                  course covering the foundations of GPU programming including
                  an introduction to GPU/parallel computing, programming with
                  CUDA, GPU libraries, tools for debugging and profiling, and
                  performance optimizations. Topics covered will include
                  Introduction to GPUs and GPU computing, programming model
                  CUDA, tools for debugging and profiling, GPU libraries (like
                  cuBLAS, cuFFT), and introduction to multi-GPU programming.},
  month        = apr,
  date         = {2024-04-08},
  organization = {JSC - as part of the Training
                  Programme of Forschungszentrum Jülich,
                  Jülich (Germany), 8 Apr 2024 - 10 Apr
                  2024},
  subtyp       = {Other},
  cin          = {JSC},
  cid          = {I:(DE-Juel1)JSC-20090406},
  pnm          = {5111 - Domain-Specific Simulation \& Data Life Cycle Labs
                  (SDLs) and Research Groups (POF4-511) / 5112 - Cross-Domain
                  Algorithms, Tools, Methods Labs (ATMLs) and Research Groups
                  (POF4-511) / 5122 - Future Computing \& Big Data Systems
                  (POF4-512) / ATML-X-DEV - ATML Accelerating Devices
                  (ATML-X-DEV)},
  pid          = {G:(DE-HGF)POF4-5111 / G:(DE-HGF)POF4-5112 /
                  G:(DE-HGF)POF4-5122 / G:(DE-Juel-1)ATML-X-DEV},
  typ          = {PUB:(DE-HGF)17},
  doi          = {10.34734/FZJ-2024-07560},
  url          = {https://juser.fz-juelich.de/record/1034807},
}