BibTeX Export
% Journal article: parallel-replay detection of wait states in MPI-2 one-sided (RMA) communication.
% The publisher full-text link is stored in `url`; `eprint` is reserved for archive identifiers.
@article{Hermanns_ea:2012:Mpi2RmaAnalysis,
  author    = {Hermanns, Marc-Andr{\'{e}} and Geimer, Markus and Mohr, Bernd and Wolf, Felix},
  title     = {Scalable detection of {MPI-2} remote memory access inefficiency patterns},
  journal   = {International Journal of High Performance Computing Applications},
  volume    = {26},
  number    = {3},
  pages     = {227--236},
  month     = aug,
  year      = {2012},
  publisher = {Sage},
  doi       = {10.1177/1094342011406758},
  url       = {http://hpc.sagepub.com/content/early/2011/06/03/1094342011406758.full.pdf+html},
  abstract  = {Wait states in parallel applications can be identified by scanning event traces for characteristic patterns. In our earlier work we defined such inefficiency patterns for MPI-2 one-sided communication, although still based on a serial trace-analysis scheme with limited scalability. In this article we show how wait states in one-sided communications can be detected in a more scalable fashion by taking advantage of a new scalable trace-analysis approach based on a parallel replay, which was originally developed for MPI-1 point-to-point and collective communication. Moreover, we demonstrate the scalability of our method and its usefulness for the optimization cycle with applications running on up to 32,768 cores.},
}
Copy