% MatchTime (Rao et al.), EMNLP 2024 proceedings paper.
% The url field uses the canonical ACL Anthology permalink, whose ID matches the DOI suffix.
@inproceedings{rao-etal-2024-matchtime,
  title     = {{MatchTime}: Towards Automatic Soccer Game Commentary Generation},
  author    = {Rao, Jiayuan and
               Wu, Haoning and
               Liu, Chang and
               Wang, Yanfeng and
               Xie, Weidi},
  editor    = {Al-Onaizan, Yaser and
               Bansal, Mohit and
               Chen, Yun-Nung},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.emnlp-main.99/},
  doi       = {10.18653/v1/2024.emnlp-main.99},
  pages     = {1671--1685},
  abstract  = {Soccer is a globally popular sport with a vast audience, in this paper, we consider constructing an automatic soccer game commentary model to improve the audiences' viewing experience. In general, we make the following contributions: First, observing the prevalent video-text misalignment in existing datasets, we manually annotate timestamps for 49 matches, establishing a more robust benchmark for soccer game commentary generation, termed as SN-Caption-test-align; Second, we propose a multi-modal temporal alignment pipeline to automatically correct and filter the existing dataset at scale, creating a higher-quality soccer game commentary dataset for training, denoted as MatchTime; Third, based on our curated dataset, we train an automatic commentary generation model, named MatchVoice. Extensive experiments and ablation studies have demonstrated the effectiveness of our alignment pipeline, and training model on the curated datasets achieves state-of-the-art performance for commentary generation, showcasing that better alignment can lead to significant performance improvements in downstream tasks.},
}
Markdown (Informal)
[MatchTime: Towards Automatic Soccer Game Commentary Generation](https://aclanthology.org/2024.emnlp-main.99/) (Rao et al., EMNLP 2024)
ACL