@inproceedings{wu-etal-2026-bidirectional,
title = "Bidirectional Semantic Enhancement for Schema Routing Across Large-Scale Databases",
author = "Wu, Yuyang and
Wang, Xiaoliang and
Nguyen, Cam-Tu",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.369/",
pages = "7495--7509",
ISBN = "979-8-89176-395-1",
abstract = "With the prevalence of Large Language Models (LLMs), Text-to-SQL has made significant progress, yet applying it to massive, real-world databases remains a challenge. While previous works adopt a retrieve-then-generate framework, they struggle with the profound semantic gap between user queries and vague schema definitions. Existing methods relying on unidirectional query expansion often fail to bridge lexical mismatches, while graph-based approaches struggle to navigate schemas when explicit structural links (e.g., foreign keys) are missing. To address this, we propose Bi-SR, a retrieval framework that bridges this gap through a bidirectional semantic enhancement strategy. We simultaneously enrich vague table schemas offline and perform online generative query expansion{---}specifically predicting potential schema structures{---}to align user intent. Crucially, we introduce a dual-augmented contrastive training objective for the dense retriever, which trains the dense retriever to recognize the semantic correspondence between the LLM-expanded query intent and the detailed schema descriptions. Experiments on massive schema routing benchmarks constructed from BIRD and Spider demonstrate that Bi-SR achieves state-of-the-art performance and significantly empowers smaller models for cost-effective deployment."
}Markdown (Informal)
[Bidirectional Semantic Enhancement for Schema Routing Across Large-Scale Databases](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.369/) (Wu et al., Findings 2026)
ACL