@inproceedings{li-etal-2025-automated,
title = "Automated Clinical Data Extraction with Knowledge Conditioned {LLM}s",
author = "Li, Diya and
Kadav, Asim and
Gao, Aijing and
Li, Rui and
Bourgon, Richard",
editor = "Rambow, Owen and
Wanner, Leo and
Apidianaki, Marianna and
Al-Khalifa, Hend and
Eugenio, Barbara Di and
Schockaert, Steven and
Darwish, Kareem and
Agarwal, Apoorv",
booktitle = "Proceedings of the 31st International Conference on Computational Linguistics: Industry Track",
month = jan,
year = "2025",
address = "Abu Dhabi, UAE",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2025.coling-industry.13/",
pages = "149--162",
abstract = "The extraction of lung lesion information from clinical and medical imaging reports is crucial for research on and clinical care of lung-related diseases. Large language models (LLMs) can be effective at interpreting unstructured text in reports, but they often hallucinate due to a lack of domain-specific knowledge, leading to reduced accuracy and posing challenges for use in clinical settings. To address this, we propose a novel framework that aligns generated internal knowledge with external knowledge through in-context learning (ICL). Our framework employs a retriever to identify relevant units of internal or external knowledge and a grader to evaluate the truthfulness and helpfulness of the retrieved internal-knowledge rules, to align and update the knowledge bases. Experiments with expert-curated test datasets demonstrate that this ICL approach can increase the F1 score for key fields (lesion size, margin and solidity) by an average of 12.9{\%} over existing ICL methods."
}
Markdown (Informal)
[Automated Clinical Data Extraction with Knowledge Conditioned LLMs](https://preview.aclanthology.org/add-emnlp-2024-awards/2025.coling-industry.13/) (Li et al., COLING 2025)
ACL