% Conference paper in the 2012 SC Companion proceedings (SCC 2012).
% NOTE(review): the citation key looks like an auto-generated export ID; it is
% kept unchanged so that existing citations of this entry still resolve.
% The full proceedings name lives in booktitle; acronyms are brace-protected so
% that sentence-casing bibliography styles do not lowercase them.
@inproceedings{4027d819656e41ab886e0f079cde20ed,
  author    = {Mehta, Kshitij and Bent, John and Torres, Aaron and Grider, Gary and Gabriel, Edgar},
  title     = {A Plugin for {HDF5} Using {PLFS} for Improved {I/O} Performance and Semantic Analysis},
  booktitle = {Proceedings - 2012 {SC} Companion: High Performance Computing, Networking Storage and Analysis, {SCC} 2012},
  year      = {2012},
  pages     = {746--752},
  doi       = {10.1109/SC.Companion.2012.102},
  isbn      = {9780769549569},
  language  = {English},
  keywords  = {HDF5, PLFS, Parallel I/O, Semantic Analysis},
  abstract  = {HDF5 is a data model, library and file format for storing and managing data. It is designed for flexible and efficient I/O for high volume and complex data. Natively, it uses a single-file format where multiple HDF5 objects are stored in a single file. In a parallel HDF5 application, multiple processes access a single file, thereby resulting in a performance bottleneck in I/O. Additionally, a single-file format does not allow semantic post processing on individual objects outside the scope of the HDF5 application. We have developed a new plugin for HDF5 using its Virtual Object Layer that serves two purposes: 1) it uses PLFS to convert the single-file layout into a data layout that is optimized for the underlying file system, and 2) it stores data in a unique way that enables semantic post-processing on data. We measure the performance of the plugin and discuss work leveraging the new semantic post-processing functionality enabled. We further discuss the applicability of this approach for exascale burst buffer storage systems.},
  note      = {2012 SC Companion: High Performance Computing, Networking Storage and Analysis, SCC 2012 ; Conference date: 10-11-2012 Through 16-11-2012},
}