% IMPORTANT: The following is UTF-8 encoded. This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.
%
% Entry notes:
%   - Both year/month and date are kept so that classic BibTeX styles
%     (year/month) and biblatex styles (date) each find a usable date.
%   - reportid, subtyp, cin, cid, pnm, pid and typ are not standard
%     BibTeX/biblatex fields; they are kept unchanged in name as extra
%     metadata and are ignored by styles that do not know them.

@misc{Herten:1034807,
  author       = {Herten, Andreas and Meinke, Jan and Haghighi Mood, Kaveh
                  and Kraus, Jiri and Hrywniak, Markus},
  title        = {{GPU} Programming Part 1: Foundations},
  reportid     = {FZJ-2024-07560},
  year         = {2024},
  month        = apr,
  date         = {2024-04-08},
  abstract     = {GPU-accelerated computing drives current scientific
                  research. Writing fast numeric algorithms for GPUs offers
                  high application performance by offloading
                  compute-intensive portions of the code to a GPU. The course
                  will cover aspects of GPU architectures and programming.
                  Focus is on the usage of the parallel programming language
                  CUDA C++, which allows maximum control of NVIDIA GPU
                  hardware. Examples of increasing complexity are used to
                  demonstrate optimization and tuning of scientific
                  applications. This course is a basic course covering the
                  foundations of GPU programming including an introduction to
                  GPU/parallel computing, programming with CUDA, GPU
                  libraries, tools for debugging and profiling, and
                  performance optimizations. Topics covered will include
                  Introduction to GPUs and GPU computing, programming model
                  CUDA, tools for debugging and profiling, GPU libraries (like
                  cuBLAS, cuFFT), and introduction to multi-GPU programming.},
  organization = {JSC - as part of the Training Programme of
                  Forschungszentrum Jülich, Jülich (Germany), 8 Apr 2024 - 10
                  Apr 2024},
  subtyp       = {Other},
  cin          = {JSC},
  cid          = {I:(DE-Juel1)JSC-20090406},
  pnm          = {5111 - Domain-Specific Simulation \& Data Life Cycle Labs
                  (SDLs) and Research Groups (POF4-511) / 5112 - Cross-Domain
                  Algorithms, Tools, Methods Labs (ATMLs) and Research Groups
                  (POF4-511) / 5122 - Future Computing \& Big Data Systems
                  (POF4-512) / ATML-X-DEV - ATML Accelerating Devices
                  (ATML-X-DEV)},
  pid          = {G:(DE-HGF)POF4-5111 / G:(DE-HGF)POF4-5112 /
                  G:(DE-HGF)POF4-5122 / G:(DE-Juel-1)ATML-X-DEV},
  typ          = {PUB:(DE-HGF)17},
  doi          = {10.34734/FZJ-2024-07560},
  url          = {https://juser.fz-juelich.de/record/1034807},
}