@inproceedings{liu-etal-2024-hit,
title = "{HIT}-{MI}{\&}{T} Lab at {S}em{E}val-2024 Task 6: {D}e{BERT}a-based Entailment Model is a Reliable Hallucination Detector",
author = "Liu, Wei and
Shi, Wanyao and
Zhang, Zijian and
Huang, Hui",
editor = {Ojha, Atul Kr. and
Do{\u{g}}ru{\"o}z, A. Seza and
Tayyar Madabushi, Harish and
Da San Martino, Giovanni and
Rosenthal, Sara and
Ros{\'a}, Aiala},
booktitle = "Proceedings of the 18th International Workshop on Semantic Evaluation (SemEval-2024)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.semeval-1.253/",
doi = "10.18653/v1/2024.semeval-1.253",
pages = "1788--1797",
abstract = "This paper describes our submission for SemEval-2024 Task 6: SHROOM, a Shared-task on Hallucinations and Related Observable Overgeneration Mistakes. We propose four groups of methods for hallucination detection: 1) Entailment Recognition; 2) Similarity Search; 3) Factuality Verification; 4) Confidence Estimation. The four methods rely on either the semantic relationship between the hypothesis and its source (target) or on the model-aware features during decoding. We participated in both the model-agnostic and model-aware tracks. Our method{'}s effectiveness is validated by our high rankings 3rd in the model-agnostic track and 5th in the model-aware track. We have released our code on GitHub."
}
Markdown (Informal)
[HIT-MI&T Lab at SemEval-2024 Task 6: DeBERTa-based Entailment Model is a Reliable Hallucination Detector](https://preview.aclanthology.org/fix-sig-urls/2024.semeval-1.253/) (Liu et al., SemEval 2024)
ACL