@inproceedings{mitra-etal-2025-factlens,
title = "{F}act{L}ens: Benchmarking Fine-Grained Fact Verification",
author = "Mitra, Kushan and
Zhang, Dan and
Rahman, Sajjadur and
Hruschka, Estevam",
editor = "Che, Wanxiang and
Nabende, Joyce and
Shutova, Ekaterina and
Pilehvar, Mohammad Taher",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2025",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingestion-acl-25/2025.findings-acl.929/",
pages = "18085--18096",
ISBN = "979-8-89176-256-5",
abstract = "Large Language Models (LLMs) have shown impressive capability in language generation and understanding, but their tendency to hallucinate and produce factually incorrect information remains a key limitation. To verify LLM-generated contents and claims from other sources, traditional verification approaches often rely on holistic models that assign a single factuality label to complex claims, potentially obscuring nuanced errors. In this paper, we advocate for a shift towards fine-grained verification, where complex claims are broken down into smaller sub-claims for individual verification, allowing for more precise identification of inaccuracies, improved transparency, and reduced ambiguity in evidence retrieval. However, generating sub-claims poses challenges, such as maintaining context and ensuring semantic equivalence with respect to the original claim. We introduce **FactLens**, a benchmark for evaluating fine-grained fact verification, with metrics and automated evaluators of sub-claim quality. The benchmark data is manually curated to ensure high-quality ground truth. Our results show alignment between automated FactLens evaluators and human judgments, and we discuss the impact of sub-claim characteristics on the overall verification performance."
}
Markdown (Informal)
[FactLens: Benchmarking Fine-Grained Fact Verification](https://preview.aclanthology.org/ingestion-acl-25/2025.findings-acl.929/) (Mitra et al., Findings 2025)
ACL
- Kushan Mitra, Dan Zhang, Sajjadur Rahman, and Estevam Hruschka. 2025. FactLens: Benchmarking Fine-Grained Fact Verification. In Findings of the Association for Computational Linguistics: ACL 2025, pages 18085–18096, Vienna, Austria. Association for Computational Linguistics.