% IMPORTANT: The following is UTF-8 encoded.  This means that in the presence
% of non-ASCII characters, it will not work with BibTeX 0.99 or older.
% Instead, you should use an up-to-date BibTeX implementation like “bibtex8” or
% “biber”.

% Journal article (JuSER record 9822).  Fields such as reportid, cin, cid, pnm,
% pid, shelfmark, typ and UT are repository metadata rather than standard
% BibTeX fields; standard styles are expected to ignore them.
@ARTICLE{Mohr:9822,
      author       = {Mohr, B. and Wylie, B. J. N. and Wolf, F.},
      title        = {Performance measurement and analysis tools for extremely
                      scalable systems},
      journal      = {Concurrency and Computation: Practice and Experience},
      volume       = {22},
      issn         = {1532-0626},
      address      = {Chichester},
      publisher    = {Wiley},
      reportid     = {PreJuSER-9822},
      pages        = {2212--2229},
      year         = {2010},
      note         = {Record converted from VDB: 12.11.2012},
      abstract     = {High-performance computing systems continue to employ more
                      and more processor cores. Current typical high-end machines
                      in industry, university, and government research laboratory
                      computing centers feature thousands of computing cores.
                      While these machines promise ever more compute power and
                      memory capacity to tackle today's complex simulation
                      problems, they force application developers to greatly
                      enhance the scalability of their codes to be able to exploit
                      it. To better support them in their porting and tuning
                      process, many parallel-tools research groups have already
                      started to work on scaling their methods, techniques, and
                      tools to extreme processor counts. In this paper, we survey
                      existing profiling and tracing tools, report on our
                      experience in using them in extreme scaling environments,
                      review working and promising new methods and techniques, and
                      discuss strategies for solving open issues and problems.
                      Copyright (C) 2010 John Wiley \& Sons, Ltd.},
      keywords     = {J (WoSType)},
      cin          = {JSC / JARA-HPC},
      ddc          = {004},
      cid          = {I:(DE-Juel1)JSC-20090406 / I:(DE-82)080012\_20140620},
      pnm          = {Scientific Computing (FUEK411) / 411 - Computational
                      Science and Mathematical Methods (POF2-411) / ATMLPP - ATML
                      Parallel Performance (ATMLPP)},
      pid          = {G:(DE-Juel1)FUEK411 / G:(DE-HGF)POF2-411 /
                      G:(DE-Juel-1)ATMLPP},
      shelfmark    = {Computer Science, Software Engineering / Computer Science,
                      Theory \& Methods},
      typ          = {PUB:(DE-HGF)16},
      UT           = {WOS:000283958700003},
      doi          = {10.1002/cpe.1585},
      url          = {https://juser.fz-juelich.de/record/9822},
}