@comment{
  AV-SUPERB conference paper (ICASSP 2024).
  The citation key is the final component of the DOI and is kept as-is so
  existing citations continue to resolve.
  Braced words in title/booktitle are acronyms protected from style recasing.
}
@inproceedings{10445941,
  author    = {Tseng, Yuan and Berry, Layne and Chen, Yi-Ting and
               Chiu, I-Hsiang and Lin, Hsuan-Hao and Liu, Max and
               Peng, Puyuan and Shih, Yi-Jen and Wang, Hung-Yu and
               Wu, Haibin and Huang, Po-Yao and Lai, Chun-Mao and
               Li, Shang-Wen and Harwath, David and Tsao, Yu and
               Mohamed, Abdelrahman and Feng, Chi-Luen and Lee, Hung-Yi},
  title     = {{AV-SUPERB}: A Multi-Task Evaluation Benchmark for Audio-Visual Representation Models},
  booktitle = {{ICASSP} 2024 -- 2024 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
  year      = {2024},
  pages     = {6890--6894},
  doi       = {10.1109/ICASSP48485.2024.10445941},
  keywords  = {Representation learning;Visualization;Soft sensors;Benchmark testing;Signal processing;Task analysis;Speech processing;Audio-Visual Learning;Representation Learning;Evaluation;Self-Supervised Learning},
}