% Gao et al., "CapOnImage" -- paper in the EMNLP 2022 proceedings.
% The url field holds the canonical ACL Anthology address (not a preview-branch
% path); the doi field is the stable identifier for this record.
@inproceedings{gao-etal-2022-caponimage,
  author    = {Gao, Yiqi and Hou, Xinglin and Zhang, Yuanmeng and Ge, Tiezheng and Jiang, Yuning and Wang, Peng},
  title     = {{CapOnImage}: Context-driven Dense-Captioning on Image},
  editor    = {Goldberg, Yoav and Kozareva, Zornitsa and Zhang, Yue},
  booktitle = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing},
  month     = dec,
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  pages     = {3449--3465},
  doi       = {10.18653/v1/2022.emnlp-main.226},
  url       = {https://aclanthology.org/2022.emnlp-main.226/},
}