@inproceedings{ehsan-solorio-2026-scalable,
title = "A Scalable Framework for Automated {NER} Annotation Correction in Low-Resource Languages",
author = "Ehsan, Toqeer and
Solorio, Thamar",
editor = "Demberg, Vera and
Inui, Kentaro and
Marquez, Llu{\'i}s",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {EACL} 2026",
month = mar,
year = "2026",
address = "Rabat, Morocco",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-eacl/2026.findings-eacl.215/",
pages = "4138--4151",
ISBN = "979-8-89176-386-9",
abstract = "Poor quality or noisy annotations in Named Entity Recognition (NER), as in any other NLP task, make it challenging to achieve state-of-the-art performance. In this paper, we present a multi-step framework to enhance the annotation quality of NER datasets by employing automated techniques. We propose a frequency-based iterative approach that leverages self-training and a dual-threshold mechanism to enhance inference confidence. Experimental evaluations on different NER datasets demonstrate significant improvements in NER performance with respect to the original datasets. This work further explores the potential of generative Large Language Models (LLMs) to perform NER for low-resource languages."
}Markdown (Informal)
[A Scalable Framework for Automated NER Annotation Correction in Low-Resource Languages](https://preview.aclanthology.org/ingest-eacl/2026.findings-eacl.215/) (Ehsan & Solorio, Findings 2026)
ACL