% Conference paper (ISRITI 2018, IEEE): hybrid NCL undersampling combined with
% A-SUWO oversampling for handling imbalanced data.
% NOTE(review): `address` holds a country rather than a publisher city -- confirm
% the intended publisher location before relying on it in printed output.
@inproceedings{8cba16dc959d4a5bb759fd5d8114921a,
  author    = {Choirunnisa, Shabrina and Lianto, Joko},
  title     = {Hybrid method of undersampling and oversampling for handling imbalanced data},
  booktitle = {2018 International Seminar on Research of Information Technology and Intelligent Systems, {ISRITI} 2018},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  pages     = {276--280},
  year      = {2018},
  month     = nov,
  doi       = {10.1109/ISRITI.2018.8864335},
  language  = {English},
  keywords  = {A-SUWO, Imbalance, NCL, Natural data, Oversampling, Undersampling},
  abstract  = {Imbalance of data occurs in various kinds of data including natural imbalanced data. If the computation process of the imbalanced data is carried out (for example clustering), the data imbalance has the potential to cause misclassification because the majority data is more dominant on minority data which results in a decrease in accuracy. The combination method of oversampling and undersampling can be one solution in solving imbalance cases. This study aims to address the problem of imbalanced data by combining the oversampling method with the undersampling method to obtain more representative synthetic data. In this study, the undersampling methods used is Neighborhood Cleaning Rules (NCL). While Adaptive Semiunsupervised Weighted Oversampling (A-SUWO) will be used as the oversampling method. After the undersampling and oversampling process is carried out, the data will be classified using the Decision Tree C4.5 and Random Forest algorithm. Performance evaluation will be processed using the calculation of precision, recall, F-measure and accuracy.},
  note      = {Publisher Copyright: {\textcopyright} 2018 IEEE.; 2018 International Seminar on Research of Information Technology and Intelligent Systems, ISRITI 2018 ; Conference date: 21-11-2018 Through 22-11-2018},
}