% Li et al. (2024), conference paper in the Findings of EMNLP 2024 volume.
% The url field uses the canonical ACL Anthology address (not a preview-branch
% build); the paper ID in the url matches the suffix of the doi.
@inproceedings{li-etal-2024-open-source,
  author    = {Li, Yucheng and Guo, Yunhao and Guerin, Frank and Lin, Chenghua},
  title     = {An Open-Source Data Contamination Report for Large Language Models},
  editor    = {Al-Onaizan, Yaser and Bansal, Mohit and Chen, Yun-Nung},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2024},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {528--541},
  doi       = {10.18653/v1/2024.findings-emnlp.30},
  url       = {https://aclanthology.org/2024.findings-emnlp.30/},
}