@inproceedings{453371d96a494f3b8bb429cdfaa166a2,
title = "PEGASEF: A provenance-based big data service framework for efficient simulation execution on shared computing clusters",
abstract = "Over the past years high-performance computing (HPC) simulation programs have been aggressively employed to solve complex problems in a variety of computational science and engineering disciplines. As those programs are shared in an online platform, many users can easily run their simulations on the platform as long as they are connected on the web. However, repetitive simulations from users have charged a significant burden on the platform{\textquoteright}s limited computing and storage resources. To address the concern of inefficiency in simulation execution, we propose a big data service framework based on past simulation records. Such records are called provenances, which capture various properties in simulation. By utilizing the provenances, the platform can perform more efficient simulations via duplicate elimination and assist users with enhanced simulation service such as result prediction, execution-time estimation, and input-parameter clustering.",
keywords = "Big data, Duplicate elimination, Efficient simulation, HPC, Provenance, Service framework",
author = "Suh, {Young Kyoon} and Lee, {Ki Yong} and Nakhoon Baek",
note = "Publisher Copyright: {\textcopyright} Springer Nature Singapore Pte Ltd. 2019.; 4th International Conference on Big Data Applications and Services, BigDAS 2017 ; Conference date: 15-08-2017 Through 18-08-2017",
year = "2019",
doi = "10.1007/978-981-13-0695-2_17",
language = "English",
isbn = "9789811306945",
series = "Advances in Intelligent Systems and Computing",
publisher = "Springer Verlag",
pages = "175--182",
editor = "Leung, {Carson K.} and Wookey Lee",
booktitle = "Big Data Applications and Services 2017 - The 4th International Conference on Big Data Applications and Services",
address = "Germany",
}