% Conference paper on the DTF I/O arbitration framework, published in the
% ISC High Performance 2018 proceedings (Springer LNCS series), pp. 63--80.
% Conventions used in this entry:
%   - names are in "Last, First" form so that BibTeX parses them unambiguously;
%   - acronyms in the title/booktitle are brace-protected so that styles which
%     sentence-case titles do not lowercase them;
%   - the citation key is the exporter's opaque identifier and is kept as-is
%     so that existing citations keep resolving.
% NOTE(review): the hyphens in "Guo-Yuan" and "Wei-keng" were restored from the
% published byline -- confirm against the DOI record.
@inproceedings{3d3820b20bfc4e38a30a81ec39838b40,
  author    = {Martsinkevich, Tatiana V. and Gerofi, Balazs and Lien, Guo-Yuan and Nishizawa, Seiya and Liao, Wei-keng and Miyoshi, Takemasa and Tomita, Hirofumi and Ishikawa, Yutaka and Choudhary, Alok},
  title     = {{DTF}: An {I/O} arbitration framework for multi-component data processing workflows},
  booktitle = {High Performance Computing -- 33rd International Conference, {ISC} High Performance 2018, Proceedings},
  editor    = {Weiland, Michele and Keyes, David and Trinitis, Carsten and Yokota, Rio},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  year      = {2018},
  pages     = {63--80},
  isbn      = {9783319920399},
  doi       = {10.1007/978-3-319-92040-5_4},
  language  = {English (US)},
  keywords  = {I/O arbitration, I/O performance, Multi-component workflow, Workflow coupling},
  abstract  = {Multi-component workflows, where one component performs a particular transformation with the data and passes it on to the next component, is a common way of performing complex computations. Using components as building blocks we can apply sophisticated data processing algorithms to large volumes of data. Because the components may be developed independently, they often use file I/O and the Parallel File System to pass data. However, as the data volume increases, file I/O quickly becomes the bottleneck in such workflows. In this work, we propose an I/O arbitration framework called DTF to alleviate this problem by silently replacing file I/O with direct data transfer between the components. DTF treats file I/O calls as I/O requests and performs I/O request matching to perform data movement. Currently, the framework works with PnetCDF-based multi-component workflows. It requires minimal modifications to applications and allows the user to easily control I/O flow via the framework{\textquoteright}s configuration file.},
  note      = {Publisher Copyright: {\textcopyright} 2018, Springer International Publishing AG, part of Springer Nature.; 33rd International Conference on ISC High Performance, 2018 ; Conference date: 24-06-2018 Through 28-06-2018},
}