% Kim et al., Findings of EMNLP 2021: post-OCR correction for scanned books.
% The url field uses the canonical ACL Anthology address (not a preview/staging
% mirror); the Anthology ID in the URL matches the suffix of the DOI.
@inproceedings{kim-etal-2021-cleaning-dirty,
  author    = {Kim, Allen and Pethe, Charuta and Inoue, Naoya and Skiena, Steve},
  title     = {Cleaning Dirty Books: Post-{OCR} Processing for Previously Scanned Texts},
  editor    = {Moens, Marie-Francine and Huang, Xuanjing and Specia, Lucia and Yih, Scott Wen-tau},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2021},
  month     = nov,
  year      = {2021},
  address   = {Punta Cana, Dominican Republic},
  publisher = {Association for Computational Linguistics},
  pages     = {4217--4226},
  doi       = {10.18653/v1/2021.findings-emnlp.356},
  url       = {https://aclanthology.org/2021.findings-emnlp.356/},
}