@comment{
  Chapter by Hia, Kuswanto and Prastyo (2023), DOI 10.1007/978-981-99-0741-0_33.
  Typed as incollection rather than inbook: the entry carries a chapter title
  plus a booktitle, and classic BibTeX styles ignore booktitle on inbook entries.
  NOTE(review): booktitle is identical to series, so it presumably holds the
  series name rather than the title of the containing volume. Confirm the
  volume title (and its volume number) via the DOI and correct booktitle.
  NOTE(review): address holds a country; BibTeX expects the publisher's city.
  Confirm and replace.
}
@incollection{43e346dbf41b41c189060dc8462b3f29,
  author    = {Hia, Supriadi and Kuswanto, Heri and Prastyo, Dedy Dwi},
  title     = {Robustness of Support Vector Regression and Random Forest Models: A Simulation Study},
  booktitle = {Lecture Notes on Data Engineering and Communications Technologies},
  series    = {Lecture Notes on Data Engineering and Communications Technologies},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2023},
  pages     = {465--479},
  doi       = {10.1007/978-981-99-0741-0_33},
  language  = {English},
  keywords  = {Outlier, Random forest, Robustness, Support vector regression},
  abstract  = {Classical statistics are usually based on parametric models, where the performance depends heavily on assumptions and is not robust in the presence of outliers in the data. Due to the COVID-19 pandemic, our daily lives have changed significantly, including slowing economic growth. These extreme changes can manifest as an outlier in time series studies and adversely affect the results of data analysis. Many classical methods of official statistics are prone to outliers. In this work, we evaluate machine learning methods: Support Vector Regression (SVR) and Random Forest (RF) and compare it with ARIMA to determine the robustness through simulation studies. Robustness is measured by the sensitivity of the SVR and Random Forest hyperparameter and the model{\textquoteright}s error in the presence of outliers. Simulations show that more outliers lead to higher RMSE values, and conversely, more samples lead to lower RMSE values. The type of outliers significantly impacts the RMSE value of the ARIMA model, where additional outliers (AO) have a worse impact than temporary change (TC). Consecutive outliers produce a smaller RMSE mean than non-consecutive outliers. Based on the sensitivity of hyperparameters, SVR and Random Forest models are relatively robust to the presence of outliers in the data. Based on the simulation results of 100 iterations, we find that SVR is more robust than ARIMA and Random Forest in modeling time series data with outliers.},
  note      = {Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd.},
}