@inproceedings{lee-etal-2025-shifting,
title = "Shifting from Ranking to Set Selection for Retrieval Augmented Generation",
author = "Lee, Dahyun and
Jo, Yongrae and
Park, Haeju and
Lee, Moontae",
editor = "Che, Wanxiang and
Nabende, Joyce and
Shutova, Ekaterina and
Pilehvar, Mohammad Taher",
booktitle = "Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.861/",
pages = "17606--17619",
ISBN = "979-8-89176-251-0",
abstract = "Retrieval in Retrieval-Augmented Generation (RAG) must ensure that retrieved passages are not only individually relevant but also collectively form a comprehensive set.Existing approaches primarily rerank top-$k$ passages based on their individual relevance, often failing to meet the information needs of complex queries in multi-hop question answering.In this work, we propose a set-wise passage selection approach and introduce SetR, which explicitly identifies the information requirements of a query through Chain-of-Thought reasoning and selects an optimal set of passages that collectively satisfy those requirements.Experiments on multi-hop RAG benchmarks show that SetR outperforms both proprietary LLM-based rerankers and open-source baselines in terms of answer correctness and retrieval quality, providing an effective and efficient alternative to traditional rerankers in RAG systems.The code is available at https://github.com/LGAI-Research/SetR"
}
Markdown (Informal)
[Shifting from Ranking to Set Selection for Retrieval Augmented Generation](https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.861/) (Lee et al., ACL 2025)
ACL