% TACL journal article (volume 14, 2026) by Dycke and Gurevych.
% The doi field is the stable identifier for this record.
% NOTE(review): the url was changed from a temporary ACL Anthology preview
% (ingest-branch) link to the canonical address built from the same Anthology
% ID, 2026.tacl-1.22 -- confirm that it resolves once the volume is published.
@article{dycke-gurevych-2026-automatic,
  author    = {Dycke, Nils and Gurevych, Iryna},
  title     = {Automatic Reviewers Fail to Detect Faulty Reasoning in Research Papers: A New Counterfactual Evaluation Framework},
  journal   = {Transactions of the Association for Computational Linguistics},
  volume    = {14},
  pages     = {465--488},
  year      = {2026},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  doi       = {10.1162/tacl.a.642},
  url       = {https://aclanthology.org/2026.tacl-1.22/},
}