% Conference paper record: RAGulator, EMNLP 2025 Industry Track proceedings.
% NOTE(review): the second author's surname was exported as "Li1" (stray digit);
% corrected here to "Liu" -- TODO confirm against the published paper.
% NOTE(review): url switched from the temporary preview/ingest path to the
% canonical Anthology URL for the same paper ID -- confirm it resolves.
@inproceedings{poey-etal-2025-ragulator,
  title     = {{RAGulator}: Lightweight Out-of-Context Detectors for Grounded Text Generation},
  author    = {Poey, Ian and
               Liu, Jiajun and
               Zhong, Qishuai},
  editor    = {Potdar, Saloni and
               Rojas-Barahona, Lina and
               Montella, Sebastien},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing: Industry Track},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.emnlp-industry.73/},
  pages     = {1057--1071},
  isbn      = {979-8-89176-333-3},
  abstract  = {Real-time identification of out-of-context outputs from large language models (LLMs) is crucial for enterprises to safely adopt retrieval augmented generation (RAG) systems. In this work, we develop lightweight models capable of detecting when LLM-generated text deviates from retrieved source documents semantically. We compare their performance against open-source alternatives on data from credit policy and sustainability reports used in the banking industry. The fine-tuned DeBERTa model stands out for its superior performance, speed, and simplicity, as it requires no additional preprocessing or feature engineering. While recent research often prioritises state-of-the-art accuracy through fine-tuned generative LLMs and complex training pipelines, we demonstrate how detection models are deployed efficiently with high speed and minimal resource usage.},
}
Markdown (Informal)
[RAGulator: Lightweight Out-of-Context Detectors for Grounded Text Generation](https://aclanthology.org/2025.emnlp-industry.73/) (Poey et al., EMNLP 2025)
ACL