@inproceedings{huang-etal-2026-structure,
title = "Structure-Aware Quantized Retrieval for Long-Document Question Answering",
author = "Huang, Hui and
Velcin, Julien and
Kessaci, Yacine",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.209/",
pages = "4291--4304",
ISBN = "979-8-89176-395-1",
abstract = "Long-document question answering is challenging because relevant evidence is often scattered across distant sections. Traditional long-document QA/RAG pipelines often suffer from context fragmentation, retrieving locally plausible but structurally misaligned passages. We present the Hierarchical Quantized Document \textbf{R}etriever (HQDR), a framework that aligns hierarchical graph representations with a universal token vocabulary and integrates explicit structure into retrieval. By grounding continuous structural features in a fixed, discrete semantic space, HQDR captures universal hierarchical patterns rather than overfitting to specific layouts. We further propose a hybrid scoring mechanism that decouples semantic matching from structural alignment. Extensive experiments on QASPER and Natural Questions demonstrate that HQDR achieves consistent gains over strong baselines and exhibits superior robustness when transferring between datasets with distinct structural characteristics."
}Markdown (Informal)
[Structure-Aware Quantized Retrieval for Long-Document Question Answering](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.209/) (Huang et al., Findings 2026)
ACL