% Garg et al., LREC 2022: survey of multimodal datasets for NLP applications.
% The url field holds the canonical ACL Anthology address for paper
% 2022.lrec-1.738, not a temporary preview-branch build of the site.
@inproceedings{garg-etal-2022-multimodality,
  title     = {Multimodality for {NLP}-Centered Applications: Resources, Advances and Frontiers},
  author    = {Garg, Muskan and
               Wazarkar, Seema and
               Singh, Muskaan and
               Bojar, Ond{\v{r}}ej},
  editor    = {Calzolari, Nicoletta and
               B{\'e}chet, Fr{\'e}d{\'e}ric and
               Blache, Philippe and
               Choukri, Khalid and
               Cieri, Christopher and
               Declerck, Thierry and
               Goggi, Sara and
               Isahara, Hitoshi and
               Maegaard, Bente and
               Mariani, Joseph and
               Mazo, H{\'e}l{\`e}ne and
               Odijk, Jan and
               Piperidis, Stelios},
  booktitle = {Proceedings of the Thirteenth Language Resources and Evaluation Conference},
  month     = jun,
  year      = {2022},
  address   = {Marseille, France},
  publisher = {European Language Resources Association},
  url       = {https://aclanthology.org/2022.lrec-1.738/},
  pages     = {6837--6847},
  abstract  = {With the development of multimodal systems and natural language generation techniques, the resurgence of multimodal datasets has attracted significant research interests, which aims to provide new information to enrich the representation of textual data. However, there remains a lack of a comprehensive survey for this task. To this end, we take the first step and present a thorough review of this research field. This paper provides an overview of a publicly available dataset with different modalities according to the applications. Furthermore, we discuss the new frontier and give our thoughts. We hope this survey of multimodal datasets can provide the community with quick access and a general picture of the multimodal dataset for specific Natural Language Processing (NLP) applications and motivates future researches. In this context, we release the collection of all multimodal datasets easily accessible here: \url{https://github.com/drmuskangarg/Multimodal-datasets}},
}
Markdown (Informal)
[Multimodality for NLP-Centered Applications: Resources, Advances and Frontiers](https://aclanthology.org/2022.lrec-1.738/) (Garg et al., LREC 2022)
ACL