% Das and Srihari, SemEval-2024 (ACL Anthology ID 2024.semeval-1.208).
% Braces in the title protect whole words whose capitalisation must survive
% sentence-casing bibliography styles. The url field is the canonical Anthology
% address for this ID, not a preview-branch deployment.
@inproceedings{das-srihari-2024-compos,
    title     = {{Compos Mentis} at {SemEval2024} Task6: A Multi-Faceted Role-based Large Language Model Ensemble to Detect Hallucination},
    author    = {Das, Souvik and
                 Srihari, Rohini},
    editor    = {Ojha, Atul Kr. and
                 Do{\u{g}}ru{\"o}z, A. Seza and
                 Tayyar Madabushi, Harish and
                 Da San Martino, Giovanni and
                 Rosenthal, Sara and
                 Ros{\'a}, Aiala},
    booktitle = {Proceedings of the 18th International Workshop on Semantic Evaluation ({SemEval-2024})},
    month     = jun,
    year      = {2024},
    address   = {Mexico City, Mexico},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2024.semeval-1.208/},
    doi       = {10.18653/v1/2024.semeval-1.208},
    pages     = {1449--1454},
    abstract  = {Hallucinations in large language models (LLMs), where they generate fluent but factually incorrect outputs, pose challenges for applications requiring strict truthfulness. This work proposes a multi-faceted approach to detect such hallucinations across various language tasks. We leverage automatic data annotation using a proprietary LLM, fine-tuning of the Mistral-7B-instruct-v0.2 model on annotated and benchmark data, role-based and rationale-based prompting strategies, and an ensemble method combining different model outputs through majority voting. This comprehensive framework aims to improve the robustness and reliability of hallucination detection for LLM generations.},
}
Markdown (Informal)
[Compos Mentis at SemEval2024 Task6: A Multi-Faceted Role-based Large Language Model Ensemble to Detect Hallucination](https://aclanthology.org/2024.semeval-1.208/) (Das & Srihari, SemEval 2024)
ACL