% Workshop paper from the KnowFM 2026 proceedings (ACL Anthology ID 2026.knowfm-1.9).
% The url field uses the permanent Anthology address built from that ID; the
% exported record pointed at a preview/staging build of the Anthology instead.
@inproceedings{du-etal-2026-multimodal,
  title     = {Multimodal Generative Engine Optimization: Rank Manipulation for Vision{--}Language Model Rankers},
  author    = {Du, Yixuan and
               Yu, Chenxiao and
               Xu, Haoyan and
               Wang, Ziyi and
               Zhao, Yue and
               Hu, Xiyang},
  editor    = {Chen, Canyu and
               Zhang, Yuji and
               Li, Zoey Sha and
               Wang, Zihan and
               Wang, Qineng and
               Su, Jinyan and
               Kargupta, Priyanka and
               Marjanovi{\'c}, Sara Vera and
               Pan, Jeff Z. and
               Bansal, Mohit and
               Augenstein, Isabelle and
               Han, Jiawei and
               Ji, Heng and
               Li, Manling},
  booktitle = {Proceedings of the 4th Workshop on Towards Knowledgeable Foundation Models ({K}now{FM} 2026)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.knowfm-1.9/},
  pages     = {115--128},
  isbn      = {979-8-89176-403-3},
}