% Conference paper: Flexpath (CCGrid 2014).
% The citation key is an opaque identifier and is kept as-is so that existing
% citations of this entry keep resolving.
% The title is stored in Title Case; styles that apply sentence casing will
% downcase it as needed.
@inproceedings{54dcfd572bc54aa596e310c0100c86fd,
  author    = {Dayal, Jai and Bratcher, Drew and Eisenhauer, Greg and Schwan, Karsten and Wolf, Matthew and Zhang, Xuechen and Abbasi, Hasan and Klasky, Scott and Podhorszki, Norbert},
  title     = {Flexpath: Type-Based Publish/Subscribe System for Large-Scale Science Analytics},
  booktitle = {Proceedings - 14th {IEEE/ACM} International Symposium on Cluster, Cloud, and Grid Computing, {CCGrid} 2014},
  publisher = {IEEE Computer Society},
  year      = {2014},
  pages     = {246--255},
  doi       = {10.1109/CCGrid.2014.104},
  isbn      = {9781479927838},
  language  = {English},
  keywords  = {Code Coupling, Data Analytics, Data Staging, Publish/Subscribe, Scalable I/O, in-Situ},
  abstract  = {As high-end systems move toward exascale sizes, a new model of scientific inquiry being developed is one in which online data analytics run concurrently with the high end simulations producing data outputs. Goals are to gain rapid insights into the ongoing scientific processes, assess their scientific validity, and/or initiate corrective or supplementary actions by launching additional computations when needed. The Flexpath system presented in this paper addresses the fundamental problem of how to structure and efficiently implement the communications between high end simulations and concurrently running online data analytics, the latter comprised of componentized dynamic services and service pipelines. Using a type-based publish/subscribe approach, Flexpath encourages diversity by permitting analytics services to differ in their computational and scaling characteristics and even in their internal execution models. Flexpath uses direct and MxN connections between interacting services to reduce data movements, to allow for runtime connectivity changes to accommodate component arrivals/departures, and to support the multiple underlying communication protocols used for analytics workflows in which simulation outputs are processed by analytics services residing on the same nodes where they are generated, on the same machine, and/or on attached or remote analytics engines. This paper describes the design and implementation of Flexpath, and evaluates it with two widely used scientific applications and their associated data analytics methods.},
  note      = {Conference date: 26--29 May 2014},
}