% Zhu et al., LREC-COLING 2024 main-conference paper (pp. 711--721).
% The url field uses the stable ACL Anthology permalink rather than a
% temporary preview/staging build, which is removed once ingestion finishes.
@inproceedings{zhu-etal-2024-alignment,
  author    = {Zhu, Zhihong
               and Zhang, Yunyan
               and Cheng, Xuxin
               and Huang, Zhiqi
               and Xu, Derong
               and Wu, Xian
               and Zheng, Yefeng},
  title     = {Alignment before Awareness: Towards Visual Question Localized-Answering in Robotic Surgery via Optimal Transport and Answer Semantics},
  editor    = {Calzolari, Nicoletta
               and Kan, Min-Yen
               and Hoste, Veronique
               and Lenci, Alessandro
               and Sakti, Sakriani
               and Xue, Nianwen},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation ({LREC-COLING} 2024)},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  pages     = {711--721},
  url       = {https://aclanthology.org/2024.lrec-main.63/},
}