% Conference paper (Findings of ACL 2026) introducing the MT-Video-Bench benchmark.
% Proper names and acronyms in title/booktitle are brace-protected as whole words
% so that sentence-casing bibliography styles keep their capitalisation.
% NOTE(review): the url below points at a preview/ingest host; confirm whether a
% canonical, non-preview address should replace it before this entry is cited.
@inproceedings{pan-etal-2026-mt,
  author    = {Pan, Yaning and Xie, Qianqian and Zhang, Guohui and Wang, Zekun Moore and Wen, Yongqian and Zhang, Yuanxing and Hu, Haoxuan and Pan, Zhiyu and Huang, Yibing and Gan, Zhidong and Lin, Yonghong and Ping, An and Li, Shihao and Wang, Yanghai and Peng, Tianhao and Liu, Jiaheng},
  title     = {{MT-Video-Bench}: A Holistic Video Understanding Benchmark for Evaluating Multimodal {LLMs} in Multi-Turn Dialogues},
  editor    = {Liakata, Maria and Moreira, Viviane P. and Zhang, Jiajun and Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  pages     = {8105--8126},
  isbn      = {979-8-89176-395-1},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.397/},
}