% CCAligned dataset paper, EMNLP 2020 main conference (ACL Anthology ID 2020.emnlp-main.480).
% The url field is the canonical ACL Anthology landing page, not a preview-branch build.
@inproceedings{el-kishky-etal-2020-ccaligned,
    title     = "{CCAligned}: A Massive Collection of Cross-Lingual Web-Document Pairs",
    author    = "El-Kishky, Ahmed and
                 Chaudhary, Vishrav and
                 Guzm{\'a}n, Francisco and
                 Koehn, Philipp",
    editor    = "Webber, Bonnie and
                 Cohn, Trevor and
                 He, Yulan and
                 Liu, Yang",
    booktitle = "Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)",
    month     = nov,
    year      = "2020",
    address   = "Online",
    publisher = "Association for Computational Linguistics",
    url       = "https://aclanthology.org/2020.emnlp-main.480/",
    doi       = "10.18653/v1/2020.emnlp-main.480",
    pages     = "5960--5969"
}