Data: https://huggingface.co/datasets/apple121/sseu-bench
Paper: https://arxiv.org/abs/2509.13148
% SSEU-Bench paper (ICASSP 2026 conference version).
% Acronyms and the first word of the subtitle are brace-protected so that
% sentence-casing bibliography styles keep their capitalisation.
% The arXiv identifier is stored in eprint/archiveprefix so the entry stays
% self-contained when copied into another .bib file.
@inproceedings{sseu-bench,
  author        = {Yin, Han and Choi, Jung-Woo},
  title         = {Can Large Audio Language Models Understand Audio Well? {Speech}, Scene and Events Understanding Benchmark for {LALMs}},
  booktitle     = {2026 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  pages         = {1--5},
  year          = {2026},
  organization  = {IEEE},
  eprint        = {2509.13148},
  archiveprefix = {arXiv},
}