% Conference paper from the Proceedings of the 57th Annual Meeting of the ACL (2019).
% ACL Anthology ID P19-1655; the url field is the canonical Anthology landing page.
% {Grounding} is braced so sentence-casing styles keep the capital after the "?".
@inproceedings{hu-etal-2019-looking,
  title     = {Are You Looking? {Grounding} to Multiple Modalities in Vision-and-Language Navigation},
  author    = {Hu, Ronghang and Fried, Daniel and Rohrbach, Anna and Klein, Dan and Darrell, Trevor and Saenko, Kate},
  editor    = {Korhonen, Anna and Traum, David and M{\`a}rquez, Llu{\'\i}s},
  booktitle = {Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics},
  month     = jul,
  year      = {2019},
  address   = {Florence, Italy},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/P19-1655/},
  doi       = {10.18653/v1/P19-1655},
  pages     = {6551--6557},
}