% Conference paper entry (ACL 2026, Volume 1: Long Papers), pages 45901--45923.
% The math in the title is brace-protected so that sentence-casing styles
% do not lowercase the symbol.
% NOTE(review): the url field points at a preview.aclanthology.org ingest host;
% presumably it should be replaced by the canonical Anthology URL once the
% volume is published -- confirm before changing.
@inproceedings{zheng-etal-2026-doc,
  title     = {Doc-{$V^*$}: Coarse-to-Fine Interactive Visual Reasoning for Multi-Page Document {VQA}},
  author    = {Zheng, Yuanlei and Fu, Pei and Li, Hang and Wang, Ziyang
               and Zhang, Yuyi and Ruan, Wenyu and Zhang, Xiaojin
               and Wei, Zhongyu and Luo, Zhenbo and Luan, Jian
               and Chen, Wei and Bai, Xiang},
  editor    = {Liakata, Maria and Moreira, Viviane P. and Zhang, Jiajun
               and Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.2129/},
  pages     = {45901--45923},
  isbn      = {979-8-89176-390-6},
}