% SlideAVSR dataset paper, ALVR workshop 2024 (ACL Anthology ID 2024.alvr-1.11).
% The url field uses the canonical Anthology address, not a preview-branch link.
@inproceedings{wang-etal-2024-slideavsr,
  author    = {Wang, Hao and Kurita, Shuhei and Shimizu, Shuichiro and Kawahara, Daisuke},
  title     = {{SlideAVSR}: A Dataset of Paper Explanation Videos for Audio-Visual Speech Recognition},
  editor    = {Gu, Jing and Fu, Tsu-Jui (Ray) and Hudson, Drew and Celikyilmaz, Asli and Wang, William},
  booktitle = {Proceedings of the 3rd Workshop on Advances in Language and Vision Research (ALVR)},
  month     = aug,
  year      = {2024},
  address   = {Bangkok, Thailand},
  publisher = {Association for Computational Linguistics},
  pages     = {129--137},
  doi       = {10.18653/v1/2024.alvr-1.11},
  url       = {https://aclanthology.org/2024.alvr-1.11/},
}