% Conference paper (ESOCC, 2017); record carries HAL identifier hal-01677626.
% pdf, hal_id and hal_version are non-standard fields that standard styles ignore.
% NOTE(review): address is kept as exported; "Oslo, Norway" is presumably the
% conference venue rather than the publisher's city -- confirm before relying on it.
@inproceedings{mahasivam:hal-01677626,
  author      = {Mahasivam, Nivethika and Nikolov, Nikolay and Sukhobok, Dina and Roman, Dumitru},
  title       = {Data Preparation as a Service Based on {Apache Spark}},
  editor      = {De Paoli, Flavio and Schulte, Stefan and Johnsen, Einar Broch},
  booktitle   = {6th European Conference on Service-Oriented and Cloud Computing ({ESOCC})},
  series      = {Lecture Notes in Computer Science},
  volume      = {10465},
  pages       = {125--139},
  publisher   = {Springer International Publishing},
  address     = {Oslo, Norway},
  year        = {2017},
  month       = sep,
  note        = {Part 4: Cloud Resources},
  doi         = {10.1007/978-3-319-67262-5_10},
  url         = {https://inria.hal.science/hal-01677626},
  pdf         = {https://inria.hal.science/hal-01677626/file/449571_1_En_10_Chapter.pdf},
  keywords    = {Distributed data parallel processing, Apache Spark, Big data preparation, Interactive data preparation},
  hal_id      = {hal-01677626},
  hal_version = {v1},
}