@inproceedings{tian-etal-2023-dynamic,
title = "Dynamic Routing Transformer Network for Multimodal Sarcasm Detection",
author = "Tian, Yuan and
Xu, Nan and
Zhang, Ruike and
Mao, Wenji",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.acl-long.139/",
doi = "10.18653/v1/2023.acl-long.139",
pages = "2468--2480",
abstract = "Multimodal sarcasm detection is an important research topic in natural language processing and multimedia computing, and benefits a wide range of applications in multiple domains. Most existing studies regard the incongruity between image and text as the indicative clue in identifying multimodal sarcasm. To capture cross-modal incongruity, previous methods rely on fixed architectures in network design, which restricts the model from dynamically adjusting to diverse image-text pairs. Inspired by routing-based dynamic network, we model the dynamic mechanism in multimodal sarcasm detection and propose the Dynamic Routing Transformer Network (DynRT-Net). Our method utilizes dynamic paths to activate different routing transformer modules with hierarchical co-attention adapting to cross-modal incongruity. Experimental results on a public dataset demonstrate the effectiveness of our method compared to the state-of-the-art methods. Our codes are available at \url{https://github.com/TIAN-viola/DynRT}."
}
Markdown (Informal)
[Dynamic Routing Transformer Network for Multimodal Sarcasm Detection](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.acl-long.139/) (Tian et al., ACL 2023)
ACL