% Chapter-level contribution (pages 221--235) to a volume of the series named
% in the series field. Typed as incollection so that classic BibTeX styles
% typeset title as the chapter title and actually use booktitle; under inbook
% those styles treat title as the book title and ignore booktitle.
% The publisher copyright notice is stored in the copyright field, which the
% standard styles do not print, so it no longer leaks into the bibliography.
% NOTE(review): booktitle merely repeats the series name, and address holds a
% country rather than the publisher's city -- confirm both against the DOI
% record before relying on this entry.
@incollection{8e8ea4823d0a47cd8db35c19afcd3d68,
  author    = {Agustini, Mety and Fithriasari, Kartika and Prastyo, Dedy Dwi},
  title     = {The Impact of Clustering-Based Sequential Multivariate Outliers Detection in Handling Missing Values},
  booktitle = {Lecture Notes on Data Engineering and Communications Technologies},
  series    = {Lecture Notes on Data Engineering and Communications Technologies},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2024},
  pages     = {221--235},
  doi       = {10.1007/978-981-97-0293-0_17},
  language  = {English},
  keywords  = {Clustering, Missing value, Multiple imputation, Outlier detection},
  abstract  = {The presence of missing values is a common issue that frequently leads to incomplete data in a wide range of research. They diminish the accessibility of the dataset that can be utilized and degrade the statistical power of the analysis. A significant focus in numerous studies has been directed toward the methods of missing value imputation. In cases where the dataset includes outliers, the imputation of missing values might be incorrect or significantly deviate from the actual values. One of the challenges that impacts the quality of data is the handling of missing values and outliers simultaneously. Several studies removed outliers before imputing missing values or deleted observations with missing values before detecting outliers. The removal approach leads to a lack of information included within the data. Other researchers integrate clustering methods into the process of missing value imputation to mitigate the impact of outliers and data variations, thereby enhancing the accuracy of the imputation model. This paper proposes a new clustering-based sequential multivariate outlier detection (SMOD) method to effectively handle incomplete data within outliers. The method is applied to an official economic statistics dataset that involves outliers and performs a missing value rate scenario of about 50 percent. In comparison with a well-known and widely used clustering technique, i.e., model-based clustering (MBC), the proposed method works well in missing value imputation.},
  copyright = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2024.},
}