@inproceedings{d2cc5c5348dc4f64830e73b6c94e858b,
title = "DuFCALF: Instilling Sentience in Computerized Song Analysis",
abstract = "Music recommendation systems have evolved significantly in the past couple of years and have become extremely popular with the advancement of Artificial Intelligence (AI). Such systems categorize songs based on disparate perspectives, like genre, artist, tempo, etc. However, there have been fewer developments in the purview of song categorization based on feelings. Songs amplify the mood of a person and often, listeners choose the type of song they want to listen to based on their mood. Hence, modeling the emotional content of songs is crucial. However, this is a challenging affair because songs embody multiple instruments and vocals in a single instance. Each of them is often modulated differently for a better experience for the listeners as well. This is very common for present-day songs and many songs of different emotions often have very similar instruments and chord progressions which further enhances the challenge. In this paper, a system is presented to distinguish song clips based on their emotion. The clips were parameterized using two features which were fed to disparate deep networks. Thereafter, a dual feature cross architecture late fusion (DuFCALF) strategy was used to distinguish the moods. Experiments were performed with multitudinous sections of songs to test its efficacy for limited data and the sadness of songs was captured with over 80% accuracy. An overall increase of 4.43% in distinction of the emotions was obtained using DuFCALF over the best-performing baseline system.",
keywords = "Audioscape, Deep learning, Emotion, Music analysis",
author = "Himadri Mukherjee and Matteo Marciano and Ankita Dhar and Kaushik Roy",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2025.; 26th International Conference on Speech and Computer, SPECOM 2024 ; Conference date: 25-11-2024 Through 28-11-2024",
year = "2025",
doi = "10.1007/978-3-031-78014-1_21",
language = "English (US)",
isbn = "9783031780134",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "277--292",
editor = "Alexey Karpov and Vlado Deli{\'c}",
booktitle = "Speech and Computer - 26th International Conference, SPECOM 2024, Proceedings",
address = "Germany",
}