@inproceedings{li-etal-2023-joyful,
title = "Joyful: Joint Modality Fusion and Graph Contrastive Learning for Multimoda Emotion Recognition",
author = "Li, Dongyuan and
Wang, Yusong and
Funakoshi, Kotaro and
Okumura, Manabu",
editor = "Bouamor, Houda and
Pino, Juan and
Bali, Kalika",
booktitle = "Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2023",
address = "Singapore",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.emnlp-main.996/",
doi = "10.18653/v1/2023.emnlp-main.996",
pages = "16051--16069",
abstract = "Multimodal emotion recognition aims to recognize emotions for each utterance from multiple modalities, which has received increasing attention for its application in human-machine interaction. Current graph-based methods fail to simultaneously depict global contextual features and local diverse uni-modal features in a dialogue. Furthermore, with the number of graph layers increasing, they easily fall into over-smoothing. In this paper, we propose a method for joint modality fusion and graph contrastive learning for multimodal emotion recognition (Joyful), where multimodality fusion, contrastive learning, and emotion recognition are jointly optimized. Specifically, we first design a new multimodal fusion mechanism that can provide deep interaction and fusion between the global contextual and uni-modal specific features. Then, we introduce a graph contrastive learning framework with inter- and intra-view contrastive losses to learn more distinguishable representations for samples with different sentiments. Extensive experiments on three benchmark datasets indicate that Joyful achieved state-of-the-art (SOTA) performance compared with all baselines. Code is released on Github (https://anonymous.4open.science/r/MERC-7F88)."
}
Markdown (Informal)
[Joyful: Joint Modality Fusion and Graph Contrastive Learning for Multimoda Emotion Recognition](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.emnlp-main.996/) (Li et al., EMNLP 2023)
ACL