@inproceedings{40d3da3dca634c1f8d1518a58d92a7e0,
title = "Deep Multilayer Perceptrons for Dimensional Speech Emotion Recognition",
abstract = "Modern deep learning architectures are ordinarily performed in high performance computing facilities due to the large size of their input features and complexity of their models. This paper proposes traditional multilayer perceptrons (MLP) with deep layers and small input sizes to tackle this computation requirement limitation. This study compares a proposed deep MLP method to the more modern deep learning architectures with the same number of layers, batch size, and optimizer. The result shows that our proposed deep MLP outperformed modern deep learning architectures, i.e., LSTM and CNN, on the same number of layers and value of parameters. Both proposed and benchmark methods were optimized in the same way. The deep MLP exhibited the highest performance on both speaker-dependent and speaker-independent scenarios on IEMOCAP and MSP-IMPROV datasets.",
keywords = "Affective computing, dimensional emotion, multilayer perceptrons, neural networks, speech emotion recognition",
author = "Atmaja, {Bagus Tris} and Masato Akagi",
note = "Publisher Copyright: {\textcopyright} 2020 APSIPA.; 2020 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2020 ; Conference date: 07-12-2020 Through 10-12-2020",
year = "2020",
month = dec,
day = "7",
language = "English",
series = "2020 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2020 - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "325--331",
booktitle = "2020 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2020 - Proceedings",
address = "United States",
}