% Workshop paper from the MAGMaR 2025 proceedings (ACL Anthology ID 2025.magmar-1.4).
% The url field uses the canonical aclanthology.org host rather than a preview build.
@inproceedings{you-etal-2025-cross,
  author    = {You, Jingyi and Sasaki, Hiroshi and Kadowaki, Kazuma},
  title     = {Cross-modal Clustering-based Retrieval for Scalable and Robust Image Captioning},
  editor    = {Kriz, Reno and Murray, Kenton},
  booktitle = {Proceedings of the 1st Workshop on Multimodal Augmented Generation via Multimodal Retrieval ({MAGMaR} 2025)},
  month     = aug,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {47--58},
  isbn      = {979-8-89176-280-0},
  url       = {https://aclanthology.org/2025.magmar-1.4/},
}