% Conference paper: NumaMMA, in the ICPP 2018 proceedings.
% The citation key is kept unchanged so existing citations continue to resolve.
% Braces in title/booktitle/series protect the tool name and acronyms from
% being lowercased by styles that apply sentence casing.
@inproceedings{73193cf89f314d5fa51e1ebc88d86504,
  author    = {Trahay, Fran{\c c}ois and Selva, Manuel and Morel, Lionel and Marquet, Kevin},
  title     = {{NumaMMA}: {NUMA} memory analyzer},
  booktitle = {Proceedings of the 47th International Conference on Parallel Processing, {ICPP} 2018},
  series    = {{ACM} International Conference Proceeding Series},
  publisher = {Association for Computing Machinery},
  year      = {2018},
  month     = aug,
  day       = {13},
  isbn      = {9781450365109},
  doi       = {10.1145/3225058.3225094},
  language  = {English},
  keywords  = {Data, Memory sampling, NUMA architectures, Performance analysis, Threads placement},
  abstract  = {Non Uniform Memory Access (NUMA) architectures are nowadays common for running High-Performance Computing (HPC) applications. In such architectures, several distinct physical memories are assembled to create a single shared memory. Nevertheless, because there are several physical memories, access times to these memories are not uniform depending on the location of the core performing the memory request and on the location of the target memory. Hence, threads and data placement are crucial to efficiently exploit such architectures. To help in taking decision about this placement, profiling tools are needed. In this work, we propose NUMA MeMory Analyzer (NumaMMA), a new profiling tool for understanding the memory access patterns of HPC applications. NumaMMA combines efficient collection of memory traces using hardware mechanisms with original visualization means allowing to see how memory access patterns evolve over time. The information reported by NumaMMA allows to understand the nature of these access patterns inside each object allocated by the application. We show how NumaMMA can help understanding the memory patterns of several HPC applications in order to optimize them and get speedups up to 28\% over the standard non optimized version.},
  note      = {Publisher Copyright: {\textcopyright} 2018 Copyright held by the owner/author(s). Publication rights licensed to ACM.; 47th International Conference on Parallel Processing, ICPP 2018 ; Conference date: 14-08-2018 Through 16-08-2018},
}