@inproceedings{yun-etal-2025-lilac,
title = "{LIL}a{C}: Late Interacting in Layered Component Graph for Open-domain Multimodal Multihop Retrieval",
author = "Yun, Joohyung and
Lee, Doyup and
Han, Wook-Shin",
editor = "Christodoulopoulos, Christos and
Chakraborty, Tanmoy and
Rose, Carolyn and
Peng, Violet",
booktitle = "Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-emnlp/2025.emnlp-main.1037/",
pages = "20551--20570",
ISBN = "979-8-89176-332-6",
abstract = "Multimodal document retrieval aims to retrieve query-relevant components from documents composed of textual, tabular, and visual elements. An effective multimodal retriever needs to handle two main challenges: (1) mitigate the effect of irrelevant contents caused by fixed, single-granular retrieval units, and (2) support multihop reasoning by effectively capturing semantic relationships among components within and across documents. To address these challenges, we propose LILaC, a multimodal retrieval framework featuring two core innovations. First, we introduce a layered component graph, explicitly representing multimodal information at two layers{---}each representing coarse and fine granularity{---}facilitating efficient yet precise reasoning. Second, we develop a late-interaction-based subgraph retrieval method, an edge-based approach that initially identifies coarse-grained nodes for efficient candidate generation, then performs fine-grained reasoning via late interaction. Extensive experiments demonstrate that LILaC achieves state-of-the-art retrieval performance on all five benchmarks, notably without additional fine-tuning. We make the artifacts publicly available at github.com/joohyung00/lilac."
}Markdown (Informal)
[LILaC: Late Interacting in Layered Component Graph for Open-domain Multimodal Multihop Retrieval](https://preview.aclanthology.org/ingest-emnlp/2025.emnlp-main.1037/) (Yun et al., EMNLP 2025)
ACL