@inproceedings{mousavi-etal-2024-dyknow,
title = "{D}y{K}now: Dynamically Verifying Time-Sensitive Factual Knowledge in {LLM}s",
author = "Mousavi, Seyed Mahed and
Alghisi, Simone and
Riccardi, Giuseppe",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2024",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.findings-emnlp.471/",
doi = "10.18653/v1/2024.findings-emnlp.471",
pages = "8014--8029",
abstract = "LLMs acquire knowledge from massive data snapshots collected at different timestamps. Their knowledge is then commonly evaluated using static benchmarks. However, factual knowledge is generally subject to time-sensitive changes, and static benchmarks cannot address those cases. We present an approach to dynamically evaluate the knowledge in LLMs and their time-sensitiveness against Wikidata, a publicly available up-to-date knowledge graph. We evaluate the time-sensitive knowledge in twenty-four private and open-source LLMs, as well as the effectiveness of four editing methods in updating the outdated facts. Our results show that 1) outdatedness is a critical problem across state-of-the-art LLMs; 2) LLMs output inconsistent answers when prompted with slight variations of the question prompt; and 3) the performance of the state-of-the-art knowledge editing algorithms is very limited, as they can not reduce the cases of outdatedness and output inconsistency."
}
Markdown (Informal)
[DyKnow: Dynamically Verifying Time-Sensitive Factual Knowledge in LLMs](https://preview.aclanthology.org/fix-sig-urls/2024.findings-emnlp.471/) (Mousavi et al., Findings 2024)
ACL