% COLING 2025 main-conference paper (ACL Anthology ID 2025.coling-main.546).
% The url field uses the canonical Anthology address, not a preview-branch build.
@inproceedings{du-etal-2025-makes,
  author    = {Du, Yifan and Guo, Hangyu and Zhou, Kun and Zhao, Wayne Xin and Wang, Jinpeng and Wang, Chuyuan and Cai, Mingchen and Song, Ruihua and Wen, Ji-Rong},
  title     = {What Makes for Good Visual Instructions? Synthesizing Complex Visual Reasoning Instructions for Visual Instruction Tuning},
  editor    = {Rambow, Owen and Wanner, Leo and Apidianaki, Marianna and Al-Khalifa, Hend and Di Eugenio, Barbara and Schockaert, Steven},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  pages     = {8197--8214},
  url       = {https://aclanthology.org/2025.coling-main.546/},
}