% Conference paper on dispel4py, published in the proceedings of the
% 11th IEEE International Conference on eScience (eScience 2015).
% Funding and copyright statements are stored in the non-standard `funding`
% and `copyright` fields, which standard styles ignore, so they are kept as
% metadata without being printed in the bibliography. The event name and
% dates are stored in `eventtitle`/`eventdate` (used by biblatex, ignored by
% classic BibTeX styles).
% NOTE(review): `address` holds a country, not the publisher's city; confirm
% the intended value before relying on it.
@inproceedings{827a1b5dd060431eb8bbd0846ae12d0f,
  author     = {Filgueira, Rosa and Krause, Amrey and Atkinson, Malcolm and Klampanos, Iraklis and Spinuso, Alessandro and Sanchez-Exposito, Susana},
  title      = {Dispel4py: An agile framework for data-intensive {eScience}},
  booktitle  = {Proceedings - 11th IEEE International Conference on eScience, eScience 2015},
  eventtitle = {11th IEEE International Conference on eScience, eScience 2015},
  eventdate  = {2015-08-31/2015-09-04},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  address    = {United States},
  year       = {2015},
  month      = oct,
  day        = {22},
  pages      = {454--464},
  doi        = {10.1109/eScience.2015.40},
  language   = {English},
  keywords   = {Data intensive application, Distributed systems, ESciences workflows, Python frameworks, Run time analysis},
  abstract   = {We present dispel4py a versatile data-intensive kit presented as a standard Python library. It empowers scientists to experiment and test ideas using their familiar rapid-prototyping environment. It delivers mappings to diverse computing infrastructures, including cloud technologies, HPC architectures and specialised data-intensive machines, to move seamlessly into production with large-scale data loads. The mappings are fully automated, so that the encoded data analyses and data handling are completely unchanged. The underpinning model is lightweight composition of fine-grained operations on data, coupled together by data streams that use the lowest cost technology available. These fine-grained workflows are locally interpreted during development and mapped to multiple nodes and systems such as MPI and Storm for production. We explain why such an approach is becoming more essential in order that data-driven research can innovate rapidly and exploit the growing wealth of data while adapting to current technical trends. We show how provenance management is provided to improve understanding and reproducibility, and how a registry supports consistency and sharing. Three application domains are reported and measurements on multiple infrastructures show the optimisations achieved. Finally we present the next steps to achieve scalability and performance.},
  funding    = {This research was supported by the VERCE project (EU FP7 RI 283543) and the Terracorrelator project (funded by NERC NE/L012979/1).},
  copyright  = {{\textcopyright} 2015 IEEE.},
}