% Wang et al., NAACL-HLT 2022 main conference paper (ACL Anthology ID 2022.naacl-main.232).
% The url uses the canonical aclanthology.org host rather than a preview/staging branch build.
@inproceedings{wang-etal-2022-ita,
  author    = {Wang, Xinyu and Gui, Min and Jiang, Yong and Jia, Zixia and Bach, Nguyen and Wang, Tao and Huang, Zhongqiang and Tu, Kewei},
  title     = {{ITA}: Image-Text Alignments for Multi-Modal Named Entity Recognition},
  editor    = {Carpuat, Marine and de Marneffe, Marie-Catherine and Meza Ruiz, Ivan Vladimir},
  booktitle = {Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies},
  pages     = {3176--3189},
  publisher = {Association for Computational Linguistics},
  address   = {Seattle, United States},
  month     = jul,
  year      = {2022},
  doi       = {10.18653/v1/2022.naacl-main.232},
  url       = {https://aclanthology.org/2022.naacl-main.232/},
}