% Shared-task submission paper in the BioNLP 2025 Shared Tasks proceedings (ACL Anthology ID 2025.bionlp-share.20).
% The url field uses the canonical Anthology address rather than a temporary preview/ingestion branch.
@inproceedings{kadusabe-etal-2025-dkitnlp,
  title     = {{DKITNLP} at {ArchEHR-QA} 2025: A Retrieval Augmented {LLM} Pipeline for Evidence-Based Patient Question Answering},
  author    = {Kadusabe, Provia and
               Kaushik, Abhishek and
               Lawless, Fiona},
  editor    = {Soni, Sarvesh and
               Demner-Fushman, Dina},
  booktitle = {{BioNLP} 2025 Shared Tasks},
  month     = aug,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.bionlp-share.20/},
  pages     = {165--170},
  isbn      = {979-8-89176-276-3},
  abstract  = {This paper describes our submission for the BioNLP ACL 2025 Shared task on grounded Question Answering (QA) from Electronic Health Records (EHRs). The task aims to automatically generate answers to patients' health related questions that are grounded in the evidence from their clinical notes. We propose a two stage retrieval pipeline to identify relevant sentences to guide response generation by a Large Language Model (LLM). Specifically, our approach uses a BioBERT based bi-encoder for initial retrieval, followed by a re-ranking step using a fine-tuned cross-encoder to enhance retrieval precision. The final set of selected sentences serve as an input to Mistral 7B model which generates answers through few-shot prompting. Our approach achieves an overall score of 31.6 on the test set, outperforming a substantially larger baseline model LLaMA 3.3 70B (30.7), which demonstrates the effectiveness of retrieval-augmented generation for grounded QA.},
}
Markdown (Informal)
[DKITNLP at ArchEHR-QA 2025: A Retrieval Augmented LLM Pipeline for Evidence-Based Patient Question Answering](https://aclanthology.org/2025.bionlp-share.20/) (Kadusabe et al., BioNLP 2025)
ACL