@inproceedings{bouziane-etal-2026-candidate,
title = "Candidate-Aware Retrieval and Reranking for Multiple-Choice Question Answering: {A}rabic as a Case Study",
author = "Bouziane, Yassine and
Moukafih, Youness and
Ghogho, Mounir",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.435/",
pages = "8967--8977",
ISBN = "979-8-89176-395-1",
abstract = "Large language models (LLMs) have recently achieved impressive results on multiple-choice question answering (MCQA), with retrieval-augmented generation (RAG) emerging as an effective strategy for improving the performance of smaller models. However, existing RAG formulations face persistent challenges: retrieving too many passages often introduces noise, and even when relevant content is retrieved, models may still struggle with partially relevant or conflicting information. Moreover, while LLMs perform strongly on English benchmarks, their accuracy declines substantially on Arabic multi-task evaluations, revealing ongoing issues in cross-lingual transfer and domain adaptation. In this paper, we propose a novel approach, using Arabic as a representative case study, that jointly models the relevance of both the question and its candidate answers when selecting contextual passages. The method employs a lightweight reranker trained with a hybrid regression{--}triplet loss objective to identify passages that provide discriminative and reliable evidence. Extensive experiments across multiple model sizes and humanities domains show that our approach consistently outperforms both standard RAG baselines and reranker baselines, delivering two- to threefold improvements while remaining competitive with considerably larger models."
}Markdown (Informal)
[Candidate-Aware Retrieval and Reranking for Multiple-Choice Question Answering: Arabic as a Case Study](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.435/) (Bouziane et al., Findings 2026)
ACL