@inproceedings{183fdd426c0942aba8ff98887ed163cc,
title = "A UNIFIED LOSS FUNCTION TO TACKLE INTER-CLASS AND INTRA-CLASS DATA IMBALANCE IN SOUND EVENT DETECTION",
abstract = "Data imbalance is an important issue in data-driven deep-learning methodologies. In sound event detection (SED), there are two types of data imbalance issues caused by the diverse time duration of sound events: the data imbalance between sound event classes (inter-class imbalance) and the active/inactive imbalance within the class (intra-class imbalance). In this paper, we propose a unified loss function (ULF), which adeptly addresses both the inter-class imbalance and intra-class imbalance simultaneously. Evaluation experiments substantiate that the ULF consistently yields superior and more stable performance compared to existing loss functions that singularly address either type of imbalance. Furthermore, the ULF loss also enhances the model's capacity to detect hard-to-detect sound events.",
keywords = "data imbalance, loss function, Sound event detection",
author = "Yuliang Zhang and Roberto Togneri and David Huang",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 49th IEEE International Conference on Acoustics, Speech, and Signal Processing,, ICASSP 2024 ; Conference date: 14-04-2024 Through 19-04-2024",
year = "2024",
doi = "10.1109/ICASSP48485.2024.10447675",
language = "English",
isbn = "979-8-3503-4486-8",
series = "ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings",
publisher = "IEEE, Institute of Electrical and Electronics Engineers",
pages = "996--1000",
booktitle = "ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)",
address = "United States",
}