@inproceedings{f2b8ef9b2bd04c8789f86061e07bd157,
title = "Word-Embedding Model for Evaluating Text Generation of Imbalanced Spam Reviews",
abstract = "Generating minor class data of spam texts is expected to solve the imbalanced problem in spam detection of product reviews. There could be semantic differences between the generated texts and the original ones. Thus, by including the semantically differed texts in the spam dataset used for training is like a noise addition. For evaluating the generated texts, some manual preparations of ground-truth data are necessary. This work has evaluated the generated texts with some approaches to ensure their context and sequence similarities compared to the original texts for better performance of a spam detection. The employed approaches are expected to eliminate the manual tasks. Our research proposes an evaluation model that consists of word-embedding pre-trained and LSTM Siamese to evaluate text generation in imbalance review. The use of a combination of pre-trained word embedding and LSTM Siamese trained model will capture the semantic aspect of the text.",
keywords = "imbalance review, pre-trained model, spam detection, text generation, word embedding",
author = "Diana Purwitasari and Zaqiyah, {Ana Alimatus} and Chastine Fatichah",
note = "Publisher Copyright: {\textcopyright} 2021 IEEE.; 13th International Conference on Advanced Computer Science and Information Systems, ICACSIS 2021 ; Conference date: 23-10-2021 Through 26-10-2021",
year = "2021",
doi = "10.1109/ICACSIS53237.2021.9631315",
language = "English",
series = "2021 International Conference on Advanced Computer Science and Information Systems, ICACSIS 2021",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2021 International Conference on Advanced Computer Science and Information Systems, ICACSIS 2021",
address = "United States",
}