@inproceedings{wang-etal-2021-fine-grained,
title = "Fine-grained Semantic Alignment Network for Weakly Supervised Temporal Language Grounding",
author = "Wang, Yuechen and
Zhou, Wengang and
Li, Houqiang",
editor = "Moens, Marie-Francine and
Huang, Xuanjing and
Specia, Lucia and
Yih, Scott Wen-tau",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2021",
month = nov,
year = "2021",
address = "Punta Cana, Dominican Republic",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2021.findings-emnlp.9/",
doi = "10.18653/v1/2021.findings-emnlp.9",
pages = "89--99",
abstract = "Temporal language grounding (TLG) aims to localize a video segment in an untrimmed video based on a natural language description. To alleviate the expensive cost of manual annotations for temporal boundary labels,we are dedicated to the weakly supervised setting, where only video-level descriptions are provided for training. Most of the existing weakly supervised methods generate a candidate segment set and learn cross-modal alignment through a MIL-based framework. However, the temporal structure of the video as well as the complicated semantics in the sentence are lost during the learning. In this work, we propose a novel candidate-free framework: Fine-grained Semantic Alignment Network (FSAN), for weakly supervised TLG. Instead of view the sentence and candidate moments as a whole, FSAN learns token-by-clip cross-modal semantic alignment by an iterative cross-modal interaction module, generates a fine-grained cross-modal semantic alignment map, and performs grounding directly on top of the map. Extensive experiments are conducted on two widely-used benchmarks: ActivityNet-Captions, and DiDeMo, where our FSAN achieves state-of-the-art performance."
}
Markdown (Informal)
[Fine-grained Semantic Alignment Network for Weakly Supervised Temporal Language Grounding](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2021.findings-emnlp.9/) (Wang et al., Findings 2021)
ACL