% TACL journal article (vol. 9, 2021). The url field uses the canonical
% ACL Anthology address for record 2021.tacl-1.35 rather than a temporary
% preview-build link; the doi field remains the primary persistent identifier.
@article{hendricks-etal-2021-decoupling,
  author    = {Hendricks, Lisa Anne and Mellor, John and Schneider, Rosalia and Alayrac, Jean-Baptiste and Nematzadeh, Aida},
  editor    = {Roark, Brian and Nenkova, Ani},
  title     = {Decoupling the Role of Data, Attention, and Losses in Multimodal Transformers},
  journal   = {Transactions of the Association for Computational Linguistics},
  volume    = {9},
  pages     = {570--585},
  year      = {2021},
  address   = {Cambridge, MA},
  publisher = {MIT Press},
  doi       = {10.1162/tacl_a_00385},
  url       = {https://aclanthology.org/2021.tacl-1.35/},
}