@comment{FEVER 2025 workshop paper. The url field uses the permanent ACL Anthology address instead of a temporary preview-branch link.}
@inproceedings{chowdhury-etal-2025-fact5,
  author    = {Chowdhury, Shayan and
               Fang, Sunny and
               Muresan, Smaranda},
  title     = {{FACT5}: A Novel Benchmark and Pipeline for Nuanced Fact-Checking of Complex Statements},
  editor    = {Akhtar, Mubashara and
               Aly, Rami and
               Christodoulopoulos, Christos and
               Cocarascu, Oana and
               Guo, Zhijiang and
               Mittal, Arpit and
               Schlichtkrull, Michael and
               Thorne, James and
               Vlachos, Andreas},
  booktitle = {Proceedings of the Eighth Fact Extraction and {VERification} Workshop ({FEVER})},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {101--117},
  isbn      = {978-1-959429-53-1},
  url       = {https://aclanthology.org/2025.fever-1.8/},
  abstract  = {Fact-checking complex statements is integral to combating misinformation, but manual approaches are time-consuming, while automated approaches often oversimplify truthfulness into binary classifications and rely on resource-intensive models. This paper introduces: (i) FACT5, a curated dataset of 150 real-world statements with five ordinal classes of truthfulness, designed to capture the nuanced nature of factual accuracy and (ii) an open-source end-to-end pipeline using large language models (LLMs) that decomposes statements into atomic claims, generates targeted questions, retrieves evidence from the web, and produces justified verdicts. We evaluate our pipeline on FACT5 using Mistral-7B-v0.3 and Google's Gemini-1.5-Flash. Our findings demonstrate significant improvements over baseline LLM performance, with Mistral-7B showing a 71.9{\%} reduction in MSE for pass@3 evaluation. The FACT5 dataset, pipeline implementation, and evaluation framework are anonymized and provided at https://github.com/shayantist/FACT5/, and a demo of the pipeline can be interacted with at https://fact5check.streamlit.app/.},
}
Markdown (Informal)
[FACT5: A Novel Benchmark and Pipeline for Nuanced Fact-Checking of Complex Statements](https://aclanthology.org/2025.fever-1.8/) (Chowdhury et al., FEVER 2025)
ACL