% Ruiz-Torrubiano, Kormann-Hainzl and Paudel (2024): conference paper on using
% synthetic data to improve robustness and resilience of ML-based smart services.
% Fields hold raw data only; presentation is left to the bibliography style.
% The former note field (publisher copyright plus conference name and date) is
% kept as data in copyright / eventtitle / eventdate so it no longer prints in
% every citation.
% NOTE(review): booktitle previously repeated the series name; it now carries
%   the event name taken from the former note field. Confirm the exact volume
%   title against the publisher record for the DOI below.
% NOTE(review): address assumes the publisher's seat is Cham (previously only
%   the country was given) -- confirm.
% NOTE(review): "than combines" in the abstract looks like a typo for
%   "that combines"; left verbatim pending a check against the published text.
@inproceedings{13a1ffb53ec94d6c94ba195d8f92984f,
  author     = {Ruiz-Torrubiano, Rub{\'e}n and Kormann-Hainzl, Gerhard and Paudel, Sarita},
  title      = {Using Synthetic Data for Improving Robustness and Resilience in {ML}-Based Smart Services},
  booktitle  = {Smart Services Summit},
  series     = {Progress in {IS}},
  publisher  = {Springer International Publishing AG},
  address    = {Cham, Switzerland},
  year       = {2024},
  month      = jul,
  day        = {31},
  pages      = {3--13},
  doi        = {10.1007/978-3-031-60313-6_1},
  isbn       = {978-3-031-60312-9},
  language   = {English},
  eventtitle = {Smart Services Summit},
  eventdate  = {2023-10-27},
  copyright  = {{\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2024.},
  keywords   = {machine learning, resilience, robustness, smart services, synthetic data},
  abstract   = {We set to answer the question of whether robustness and resilience of machine learning (ML) based smart services in the Internet-of-Things (IoT) context can be improved by using synthetic data. These data can be in the form of training data for ML algorithms or service interactions. While there is plenty of research on the use of synthetic data in general ML models, there is a lack of understanding on the use of synthetic data in the smart service context. This can help make smart services more resilient by solving the cold-start problem and improve their generalization capabilities. We propose an architecture for ML-based smart services that integrates both real and synthetic data and perform an empirical evaluation than combines publicly available sensor data (streamflow data) and state-of-the-art synthetic data generation methods. Using standard performance metrics, our results show that enhancing a dataset with synthetic data can improve performance significantly even with a modest amount of data.},
}