% WAT 2025 workshop paper (ACL Anthology ID 2025.wat-1.13).
% The url field uses the canonical Anthology address instead of the temporary
% "preview ... ingest" staging link, which is not a stable citation target.
@inproceedings{betala-etal-2025-picture,
  author    = {Betala, Siddharth and Raj, Kushan and Betala, Vipul and Saswade, Rohan},
  title     = {A Picture is Worth a Thousand (Correct) Captions: A Vision-Guided Judge-Corrector System for Multimodal Machine Translation},
  editor    = {Nakazawa, Toshiaki and Goto, Isao},
  booktitle = {Proceedings of the Twelfth Workshop on Asian Translation ({WAT} 2025)},
  month     = dec,
  year      = {2025},
  address   = {Mumbai, India},
  publisher = {Association for Computational Linguistics},
  pages     = {124--137},
  isbn      = {979-8-89176-309-8},
  url       = {https://aclanthology.org/2025.wat-1.13/},
}