% Workshop paper, ACL Anthology ID 2021.wassa-1.14 (WASSA 2021).
% The url field uses the canonical Anthology address rather than a
% temporary preview-branch host, so the link stays valid over time.
@inproceedings{sourav-ouyang-2021-lightweight,
  title     = {Lightweight Models for Multimodal Sequential Data},
  author    = {Sourav, Soumya and
               Ouyang, Jessica},
  editor    = {De Clercq, Orphee and
               Balahur, Alexandra and
               Sedoc, Joao and
               Barriere, Valentin and
               Tafreshi, Shabnam and
               Buechel, Sven and
               Hoste, Veronique},
  booktitle = {Proceedings of the Eleventh Workshop on Computational Approaches to Subjectivity, Sentiment and Social Media Analysis},
  month     = apr,
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2021.wassa-1.14/},
  pages     = {129--137},
  abstract  = {Human language encompasses more than just text; it also conveys emotions through tone and gestures. We present a case study of three simple and efficient Transformer-based architectures for predicting sentiment and emotion in multimodal data. The Late Fusion model merges unimodal features to create a multimodal feature sequence, the Round Robin model iteratively combines bimodal features using cross-modal attention, and the Hybrid Fusion model combines trimodal and unimodal features together to form a final feature sequence for predicting sentiment. Our experiments show that our small models are effective and outperform the publicly released versions of much larger, state-of-the-art multimodal sentiment analysis systems.},
}
Markdown (Informal)
[Lightweight Models for Multimodal Sequential Data](https://aclanthology.org/2021.wassa-1.14/) (Sourav & Ouyang, WASSA 2021)
ACL
- Soumya Sourav and Jessica Ouyang. 2021. Lightweight Models for Multimodal Sequential Data. In Proceedings of the Eleventh Workshop on Computational Approaches to Subjectivity, Sentiment and Social Media Analysis, pages 129–137, Online. Association for Computational Linguistics.