% EMNLP 2025 proceedings paper (ACL Anthology ID 2025.emnlp-main.1012).
% The url field uses the canonical aclanthology.org address; the original
% pointed at the temporary "ingest-emnlp" preview build.
@inproceedings{shafique-etal-2025-culturally,
  author    = {Shafique, Bhuiyan Sanjid
               and Vayani, Ashmal
               and Maaz, Muhammad
               and Rasheed, Hanoona Abdul
               and Dissanayake, Dinura
               and Kurpath, Mohammed Irfan
               and Hmaiti, Yahya
               and Inoue, Go
               and Lahoud, Jean
               and Rashid, Md. Safirur
               and Quasem, Shadid Intisar
               and Fatima, Maheen
               and Vidal, Franco
               and Maslych, Mykola
               and More, Ketan Pravin
               and Baliah, Sanoojan
               and Watawana, Hasindri
               and Li, Yuhao
               and Farestam, Fabian
               and Schaller, Leon
               and Tymtsiv, Roman
               and Weber, Simon
               and Cholakkal, Hisham
               and Laptev, Ivan
               and Satoh, Shin{'}ichi
               and Felsberg, Michael
               and Shah, Mubarak
               and Khan, Salman
               and Khan, Fahad Shahbaz},
  title     = {A Culturally-diverse Multilingual Multimodal Video Benchmark {\&} Model},
  editor    = {Christodoulopoulos, Christos
               and Chakraborty, Tanmoy
               and Rose, Carolyn
               and Peng, Violet},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  pages     = {20009--20033},
  isbn      = {979-8-89176-332-6},
  url       = {https://aclanthology.org/2025.emnlp-main.1012/},
}