@inproceedings{a114a9f2403f424799c31977922cc3f1,
title = "Multi Label Sound Classification using Deep Learning Models",
abstract = "Accurate and automated sound classification enables a strong groundwork for diverse advanced deep learning applications within the audio and music domain. This study focuses on the application of Convolutional Neural Networks (CNN) and combined LSTM (Long Short-Term Memory) and GRU (Gated Recurrent unit) models for instrument classification from audio signals, contributing to intelligent audio processing systems. Our proposed model exclusively utilizes the Mel-frequency cepstral coefficients (MFCCs) extraction from the audio data for preprocessing. A large and complex dataset, including Nineteen instrument classes are used for training and evaluation. These experimental results demonstrate promising performance, with our proposed CNN architecture achieving an impressive accuracy of 97%, and the LSTM-GRU model achieves a lower accuracy of 80%, compared to the CNN model on the multi-label sound classification task for instruments classes, but its ability to model temporal dependencies add valuable insights into the dynamics of instrument audio sequences. These findings provide valuable insights for researchers and practitioners in audio signal processing and machine learning.",
keywords = "audio classification, CNN, deep learning, GRU, instrument recognition, LSTM, MFCCs, multi-label classification, sound classification",
author = "Onisha, {Tasnim Akter} and Jongyeop Kim and Jongho Seol",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 22nd IEEE/ACIS International Conference on Software Engineering Research, Management and Applications, SERA 2024 ; Conference date: 30-05-2024 Through 01-06-2024",
year = "2024",
doi = "10.1109/SERA61261.2024.10685563",
language = "English",
series = "2024 IEEE/ACIS 22nd International Conference on Software Engineering Research, Management and Applications, SERA 2024 - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "129--134",
editor = "Teruhisa Hochin and Jixin Ma and Osamu Mizuno",
booktitle = "2024 IEEE/ACIS 22nd International Conference on Software Engineering Research, Management and Applications, SERA 2024 - Proceedings",
address = "United States",
}