% OJ4OCRMT dataset paper, Proceedings of Machine Translation Summit XX, Volume 1 (2025).
% The url is the canonical ACL Anthology permalink for ID 2025.mtsummit-1.9,
% not the temporary ingestion-preview host, which is not a stable address.
@inproceedings{mcnamee-etal-2025-oj4ocrmt,
  title     = {{OJ4OCRMT}: A Large Multilingual Dataset for {OCR-MT} Evaluation},
  author    = {McNamee, Paul and
               Duh, Kevin and
               Carpenter, Cameron and
               Colaianni, Ron and
               King, Nolan and
               Murray, Kenton},
  editor    = {Bouillon, Pierrette and
               Gerlach, Johanna and
               Girletti, Sabrina and
               Volkart, Lise and
               Rubino, Raphael and
               Sennrich, Rico and
               Farinha, Ana C. and
               Gaido, Marco and
               Daems, Joke and
               Kenny, Dorothy and
               Moniz, Helena and
               Szoc, Sara},
  booktitle = {Proceedings of Machine Translation Summit XX: Volume 1},
  month     = jun,
  year      = {2025},
  address   = {Geneva, Switzerland},
  publisher = {European Association for Machine Translation},
  url       = {https://aclanthology.org/2025.mtsummit-1.9/},
  pages     = {113--125},
  isbn      = {978-2-9701897-0-1},
}