% Conference paper from the EMNLP 2024 proceedings (ACL Anthology ID 2024.emnlp-main.454).
% The url field uses the canonical aclanthology.org landing page rather than a
% temporary preview-branch deployment, so the link stays valid after ingestion.
@inproceedings{bulat-etal-2024-efficient,
  title     = {Efficient Vision-Language pre-training via domain-specific learning for human activities},
  author    = {Bulat, Adrian and Ouali, Yassine and Guerrero, Ricardo and Martinez, Brais and Tzimiropoulos, Georgios},
  editor    = {Al-Onaizan, Yaser and Bansal, Mohit and Chen, Yun-Nung},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.emnlp-main.454/},
  doi       = {10.18653/v1/2024.emnlp-main.454},
  pages     = {7978--8000}
}