Journal article in Computational Linguistics 50(2), June 2024.
The url field uses the permanent ACL Anthology address for paper ID 2024.cl-2.9;
the doi field remains the preferred persistent identifier.
@article{thomson-etal-2024-common,
  author    = {Thomson, Craig and Reiter, Ehud and Belz, Anya},
  title     = {Common Flaws in Running Human Evaluation Experiments in {NLP}},
  journal   = {Computational Linguistics},
  volume    = {50},
  number    = {2},
  pages     = {795--805},
  month     = jun,
  year      = {2024},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  doi       = {10.1162/coli_a_00508},
  url       = {https://aclanthology.org/2024.cl-2.9/},
}