% Efrat et al., EMNLP 2021 main-conference paper presenting the Cryptonite dataset.
% The url field is the permanent ACL Anthology landing page for paper ID
% 2021.emnlp-main.344 (the same ID that forms the DOI suffix), not a preview build.
@inproceedings{efrat-etal-2021-cryptonite,
    title     = {Cryptonite: A Cryptic Crossword Benchmark for Extreme Ambiguity in Language},
    author    = {Efrat, Avia and
                 Shaham, Uri and
                 Kilman, Dan and
                 Levy, Omer},
    editor    = {Moens, Marie-Francine and
                 Huang, Xuanjing and
                 Specia, Lucia and
                 Yih, Scott Wen-tau},
    booktitle = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing},
    month     = nov,
    year      = {2021},
    address   = {Online and Punta Cana, Dominican Republic},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2021.emnlp-main.344/},
    doi       = {10.18653/v1/2021.emnlp-main.344},
    pages     = {4186--4192},
    abstract  = {Current NLP datasets targeting ambiguity can be solved by a native speaker with relative ease. We present Cryptonite, a large-scale dataset based on cryptic crosswords, which is both linguistically complex and naturally sourced. Each example in Cryptonite is a cryptic clue, a short phrase or sentence with a misleading surface reading, whose solving requires disambiguating semantic, syntactic, and phonetic wordplays, as well as world knowledge. Cryptic clues pose a challenge even for experienced solvers, though top-tier experts can solve them with almost 100{\%} accuracy. Cryptonite is a challenging task for current models; fine-tuning T5-Large on 470k cryptic clues achieves only 7.6{\%} accuracy, on par with the accuracy of a rule-based clue solver (8.6{\%}).},
}
Markdown (Informal)
[Cryptonite: A Cryptic Crossword Benchmark for Extreme Ambiguity in Language](https://aclanthology.org/2021.emnlp-main.344/) (Efrat et al., EMNLP 2021)
ACL