How Many Threads will be too Many? On the Scalability of OpenMP Implementations

Iwainsky, Christian; Knobloch, Michael; Calotoiu, Alexandru; Shudler, Sergei; Bischof, Christian; Wolf, Felix; Strube, Alexandre
doi:10.1007/978-3-662-48096-0_35
% IMPORTANT: The following is UTF-8 encoded.  This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.

% Conference paper in the Euro-Par 2015 proceedings (LNCS volume 9233).
% Field groups, in order: bibliographic core, identifiers, abstract, and
% finally the repository-specific bookkeeping fields (reportid, cin, ddc,
% cid, pnm, pid, typ, UT), which standard styles ignore.
% Both year/month and date are kept: classic BibTeX styles read year/month,
% biblatex reads date.
% The conference itself is described by eventtitle/venue/eventdate rather
% than organization, which standard styles treat as the sponsoring body.
% The comment field preserves the raw exported proceedings string from which
% booktitle and editor were split.
@inproceedings{Iwainsky:280948,
      author       = {Iwainsky, Christian and Shudler, Sergei and Calotoiu,
                      Alexandru and Strube, Alexandre and Knobloch, Michael and
                      Bischof, Christian and Wolf, Felix},
      title        = {How Many Threads will be too Many? {On} the
                      Scalability of {OpenMP} Implementations},
      booktitle    = {{Euro-Par} 2015: Parallel Processing},
      editor       = {Träff, Jesper Larsson},
      series       = {Lecture Notes in Computer Science},
      volume       = {9233},
      pages        = {451--463},
      publisher    = {Springer Berlin Heidelberg},
      address      = {Berlin, Heidelberg},
      year         = {2015},
      month        = aug,
      date         = {2015-08-24},
      eventtitle   = {21st International Conference on Parallel and
                      Distributed Computing},
      venue        = {Vienna, Austria},
      eventdate    = {2015-08-24/2015-08-28},
      isbn         = {978-3-662-48095-3},
      doi          = {10.1007/978-3-662-48096-0_35},
      url          = {https://juser.fz-juelich.de/record/280948},
      abstract     = {Exascale systems will exhibit much higher degrees of
                      parallelism both in terms of the number of nodes and the
                      number of cores per node. OpenMP is a widely used standard
                      for exploiting parallelism on the level of individual nodes.
                      Although successfully used on today’s systems, it is
                      unclear how well OpenMP implementations will scale to much
                      higher numbers of threads. In this work, we apply automated
                      performance modeling to examine the scalability of OpenMP
                      constructs across different compilers and platforms. We ran
                      tests on Intel Xeon multi-board, Intel Xeon Phi, and Blue
                      Gene with compilers from GNU, IBM, Intel, and PGI. The
                      resulting models reveal a number of scalability issues in
                      implementations of OpenMP constructs and show unexpected
                      differences between compilers.},
      comment      = {Euro-Par 2015: Parallel Processing / Träff, Jesper Larsson
                      (Editor)},
      reportid     = {FZJ-2016-00659},
      cin          = {JSC},
      ddc          = {004},
      cid          = {I:(DE-Juel1)JSC-20090406},
      pnm          = {511 - Computational Science and Mathematical Methods
                      (POF3-511) / ATMLPP - ATML Parallel Performance (ATMLPP)},
      pid          = {G:(DE-HGF)POF3-511 / G:(DE-Juel-1)ATMLPP},
      typ          = {PUB:(DE-HGF)8},
      UT           = {WOS:000363786800035},
}
guest :: login JuSER
		Search		Submit		Personalize Your alerts Your baskets Your searches		Help