Findings of EMNLP 2023 paper on LLM data contamination in NLP benchmarks.
The url uses the permanent ACL Anthology address (not a preview/staging host);
its Anthology ID matches the one embedded in the doi.
NOTE(review): "de Lacalle, Oier Lopez" may be a mis-split of the compound
surname "Lopez de Lacalle"; if so, use "{Lopez de Lacalle}, Oier" -- confirm
against the paper before changing.

@inproceedings{sainz-etal-2023-nlp,
  author    = {Sainz, Oscar and Campos, Jon and Garc{\'i}a-Ferrero, Iker and Etxaniz, Julen and de Lacalle, Oier Lopez and Agirre, Eneko},
  title     = {{NLP} Evaluation in trouble: On the Need to Measure {LLM} Data Contamination for each Benchmark},
  editor    = {Bouamor, Houda and Pino, Juan and Bali, Kalika},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2023},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  pages     = {10776--10787},
  doi       = {10.18653/v1/2023.findings-emnlp.722},
  url       = {https://aclanthology.org/2023.findings-emnlp.722/},
}