@inproceedings{04336b5fdbab4466ab9a23ee8bfea469,
title = "Performance evaluation of anomaly detection in imbalanced system log data",
abstract = "An administrator needs to examine operating system log files for any anomalous events. In real-life log data, the number of anomalies is often smaller than the normal ones. This imbalance situation affects the performance of the anomaly detectors because a large number of normal events feed the training of the classifier. In this paper, we evaluate popular machine learning methods and consider this problem of data imbalance. We compare data oversampling and undersampling approaches before inputting them to the classifier. Experimental results demonstrate that by taking data imbalance into consideration, there is an improvement in the method performance in terms of precision and recall scores.",
keywords = "Anomaly detection, Imbalanced data, Machine learning, System logs",
author = "Hudan Studiawan and Ferdous Sohel",
note = "Publisher Copyright: {\textcopyright} 2020 IEEE.; 2020 World Conference on Smart Trends in Systems, Security and Sustainability, WS4 2020 ; Conference date: 27-07-2020 Through 28-07-2020",
year = "2020",
month = jul,
doi = "10.1109/WorldS450073.2020.9210329",
language = "English",
series = "Proceedings of the World Conference on Smart Trends in Systems, Security and Sustainability, WS4 2020",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "239--246",
editor = "Xin-She Yang and Fong, {Simon James} and Toapanta, {Segundo Moises} and Ion Andronache and Niko Phillips",
booktitle = "Proceedings of the World Conference on Smart Trends in Systems, Security and Sustainability, WS4 2020",
address = "United States",
}