% Conference paper, NAACL 2025 Industry Track (ACL Anthology ID 2025.naacl-industry.61).
% The url field uses the canonical Anthology permalink rather than a staging preview build.
% NOTE(review): the given names "Pjm" and "Rhr" look like run-together initials
% (possibly "P. J. M." and "R. H. R.") -- confirm against the paper before changing them.
@inproceedings{li-etal-2025-evaluating-performance,
  title     = {Evaluating the Performance of {RAG} Methods for Conversational {AI} in the Airport Domain},
  author    = {Li, Yuyang and
               Kerbusch, Pjm and
               Pruim, Rhr and
               K{\"a}fer, Tobias},
  editor    = {Chen, Weizhu and
               Yang, Yi and
               Kachuee, Mohammad and
               Fu, Xue-Yong},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 3: Industry Track)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.naacl-industry.61/},
  pages     = {794--808},
  isbn      = {979-8-89176-194-0},
  abstract  = {Airports from the top 20 in terms of annual passengers are highly dynamic environment with thousands of flights daily, and they aim to increase the degree of automation. To contribute to this, we implemented a Conversational AI system that enables staff in an airport to communicate with flight information systems. This system not only answers standard airport queries but also resolves airport terminology, jargon, abbreviations, and dynamic questions involving reasoning. In this paper, we built three different Retrieval-Augmented Generation (RAG) methods, including traditional RAG, SQL RAG, and Knowledge Graph-based RAG (Graph RAG). Experiments showed that traditional RAG achieved 84.84{\%} accuracy using BM25 + GPT-4 but occasionally produced hallucinations, which is risky to airport safety. In contrast, SQL RAG and Graph RAG achieved 80.85{\%} and 91.49{\%} accuracy respectively, with significantly fewer hallucinations. Moreover, Graph RAG was especially effective for questions that involved reasoning. Based on our observations, we thus recommend SQL RAG and Graph RAG are better for airport environments, due to fewer hallucinations and the ability to handle dynamic questions.},
}
Markdown (Informal)
[Evaluating the Performance of RAG Methods for Conversational AI in the Airport Domain](https://aclanthology.org/2025.naacl-industry.61/) (Li et al., NAACL 2025)
ACL