% Workshop paper from the Sixth Workshop on Vision and Language (2017);
% ACL Anthology identifier W17-2003. The url field uses the permanent
% aclanthology.org address rather than a preview/staging mirror.
@inproceedings{nurani-venkitasubramanian-etal-2017-learning,
  author    = {Nurani Venkitasubramanian, Aparna and Tuytelaars, Tinne and Moens, Marie-Francine},
  title     = {Learning to Recognize Animals by Watching Documentaries: Using Subtitles as Weak Supervision},
  editor    = {Belz, Anya and Erdem, Erkut and Pastra, Katerina and Mikolajczyk, Krystian},
  booktitle = {Proceedings of the Sixth Workshop on Vision and Language},
  month     = apr,
  year      = {2017},
  address   = {Valencia, Spain},
  publisher = {Association for Computational Linguistics},
  pages     = {21--30},
  doi       = {10.18653/v1/W17-2003},
  url       = {https://aclanthology.org/W17-2003/},
}