@inproceedings{allen-etal-2024-shroom,
title = "{SHROOM}-{INDE}lab at {S}em{E}val-2024 Task 6: Zero- and Few-Shot {LLM}-Based Classification for Hallucination Detection",
author = "Allen, Bradley and
Polat, Fina and
Groth, Paul",
editor = {Ojha, Atul Kr. and
Do{\u{g}}ru{\"o}z, A. Seza and
Tayyar Madabushi, Harish and
Da San Martino, Giovanni and
Rosenthal, Sara and
Ros{\'a}, Aiala},
booktitle = "Proceedings of the 18th International Workshop on Semantic Evaluation (SemEval-2024)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.semeval-1.120/",
doi = "10.18653/v1/2024.semeval-1.120",
pages = "839--844",
abstract = "We describe the University of Amsterdam Intelligent Data Engineering Lab team{'}s entry for the SemEval-2024 Task 6 competition. The SHROOM-INDElab system builds on previous work on using prompt programming and in-context learning with large language models (LLMs) to build classifiers for hallucination detection, and extends that work through the incorporation of context-specific definition of task, role, and target concept, and automated generation of examples for use in a few-shot prompting approach. The resulting system achieved fourth-best and sixth-best performance in the model-agnostic track and model-aware tracks for Task 6, respectively, and evaluation using the validation sets showed that the system{'}s classification decisions were consistent with those of the crowdsourced human labelers. We further found that a zero-shot approach provided better accuracy than a few-shot approach using automatically generated examples. Code for the system described in this paper is available on Github."
}
Markdown (Informal)
[SHROOM-INDElab at SemEval-2024 Task 6: Zero- and Few-Shot LLM-Based Classification for Hallucination Detection](https://preview.aclanthology.org/fix-sig-urls/2024.semeval-1.120/) (Allen et al., SemEval 2024)
ACL