@inproceedings{park-etal-2026-enhancing,
title = "Enhancing Multilingual {RAG} Systems with Debiased Language Preference-Guided Query Fusion",
author = "Park, Jeonghyun and
Kim, Byeongjeong and
Hwang, Seojin and
Lee, Hwanhee",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1353/",
pages = "27116--27136",
ISBN = "979-8-89176-395-1",
abstract = "Multilingual Retrieval-Augmented Generation (mRAG) systems often exhibit a perceived preference for high-resource languages, particularly English, resulting in the widespread adoption of English pivoting. While prior studies attribute this advantage to the superior English-centric capabilities of Large Language Models (LLMs), we find that such measurements are significantly distorted by structural priors inherent in evaluation benchmarks. Specifically, we identify exposure bias and a gold availability prior{---}both driven by the disproportionate concentration of resources in English{---}as well as cultural priors rooted in topic locality, as factors that hinder accurate assessment of genuine language preference. To address these biases, we propose DeLP (Debiased Language Preference), a calibrated metric designed to explicitly factor out these structural confounds. Our analysis using DeLP reveals that the previously reported English preference is largely a byproduct of evidence distribution rather than an inherent model bias. Instead, we find that retrievers fundamentally favor monolingual alignment between the query and the document language. Building on this insight, we introduce DELTA (DEbiased Language preference{--}guided Text Augmentation), a lightweight and efficient mRAG framework that strategically leverages monolingual alignment to optimize cross-lingual retrieval and generation. Experimental results demonstrate that DELTA consistently outperforms English pivoting and mRAG baselines across diverse languages."
}Markdown (Informal)
[Enhancing Multilingual RAG Systems with Debiased Language Preference-Guided Query Fusion](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1353/) (Park et al., Findings 2026)
ACL