@inproceedings{e834e3e8fe094e7980d2dfeeb0168690,
title = "Asterism: Pegasus and Dispel4py Hybrid Workflows for Data-Intensive Science",
abstract = "We present Asterism, an open source data-intensive framework, which combines the strengths of traditional workflow management systems with new parallel stream-based dataflow systems to run data-intensive applications across multiple heterogeneous resources, without users having to: re-formulate their methods according to different enactment engines; manage the data distribution across systems; parallelize their methods; co-place and schedule their methods with computing resources; and store and transfer large/small volumes of data. We also present the Data-Intensive workflows as a Service (DIaaS) model, which enables easy dataintensive workow composition and deployment on clouds using containers. The feasibility of Asterism and DIaaS model have been evaluated using a real domain application on the NSF-Chameleon cloud. Experimental results shows how Asterism successfully and efficiently exploits combinations of diverse computational platforms, whereas DIaaS delivers specialized software to execute data-intensive applications in a scalable, efficient, and robust way reducing the engineering time and computational cost.",
keywords = "Data-Intensive science, Deployment and reusability of execution environments, scientific workows, stream-based system",
author = "Rosa Filgueira and Silva, {Rafael Ferreira Da} and Amrey Krause and Ewa Deelman and Malcolm Atkinson",
note = "Publisher Copyright: {\textcopyright} 2016 IEEE.; 7th International Workshop on Data-Intensive Computing in the Clouds, DataCloud 2016 ; Conference date: 14-11-2016",
year = "2017",
month = feb,
day = "6",
doi = "10.1109/DataCloud.2016.004",
language = "English",
series = "Proceedings of DataCloud 2016: 7th International Workshop on Data-Intensive Computing in the Clouds - Held in conjunction with SC 2016: The International Conference for High Performance Computing, Networking, Storage and Analysis",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "1--8",
booktitle = "Proceedings of DataCloud 2016",
address = "United States",
}