@inbook{5832f21506a94bebaa3692482fe96fa3,
title = "An Empirical Method for Processing I/O Traces to Analyze the Performance of DL Applications",
abstract = "The exponential growth of data handled by Deep Learning (DL) applications has led to an unprecedented demand for computational resources, necessitating their execution on High Performance Computing (HPC) systems. However, understanding and optimizing Input/Output (I/O) of the DL applications can be challenging due to the complexity and scale of DL workloads and the heterogeneous nature of I/O operations. This paper addresses this issue by proposing an I/O traces processing method that simplifies the generation of reports on global I/O patterns and performance to aid in I/O performance analysis. Our approach focuses on understanding the temporal and spatial distributions of I/O operations and related with the behavior at I/O system level. The proposed method enables us to synthesize and extract key information from the reports generated by tools such as Darshan tool and the seff command. These reports offer a detailed view of I/O performance, providing a set of metrics that deepen our understanding of the I/O behavior of DL applications.",
keywords = "DL, HPC, I/O Analysis, I/O behavior patterns",
author = "Edixon Parraga and Betzabeth Leon and Sandra Mendez and Dolores Rexachs and Remo Suppi and Emilio Luque",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2025.",
year = "2024",
month = oct,
day = "11",
doi = "10.1007/978-3-031-70807-7\_6",
language = "English",
isbn = "978-3-031-70807-7",
series = "Communications in Computer and Information Science",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "74--90",
editor = "Marcelo Naiouf and \{De Giusti\}, Laura and Franco Chichizola and Leandro Libutti",
booktitle = "Cloud Computing, Big Data and Emerging Topics - 12th Conference, JCC-BD and ET 2024, Revised Selected Papers",
}