% Conference paper in the Findings of ACL-IJCNLP 2021 volume.
% The url field uses the permanent aclanthology.org address (same Anthology ID
% as the DOI suffix) instead of a temporary preview-branch host.
@inproceedings{chen-etal-2021-multimodal,
  author    = {Chen, Feilong and Meng, Fandong and Chen, Xiuyi and Li, Peng and Zhou, Jie},
  title     = {Multimodal Incremental Transformer with Visual Grounding for Visual Dialogue Generation},
  editor    = {Zong, Chengqing and Xia, Fei and Li, Wenjie and Navigli, Roberto},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL-IJCNLP} 2021},
  month     = aug,
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {436--446},
  doi       = {10.18653/v1/2021.findings-acl.38},
  url       = {https://aclanthology.org/2021.findings-acl.38/},
}