% Conference paper in the CLiC-it 2024 proceedings. The url field uses the
% canonical ACL Anthology address rather than a temporary preview-branch link.
@inproceedings{saioni-giannone-2024-multimodal,
  title     = {Multimodal Attention Is All You Need},
  author    = {Saioni, Marco and
               Giannone, Cristina},
  editor    = {Dell'Orletta, Felice and
               Lenci, Alessandro and
               Montemagni, Simonetta and
               Sprugnoli, Rachele},
  booktitle = {Proceedings of the 10th Italian Conference on Computational Linguistics ({CLiC-it} 2024)},
  month     = dec,
  year      = {2024},
  address   = {Pisa, Italy},
  publisher = {CEUR Workshop Proceedings},
  url       = {https://aclanthology.org/2024.clicit-1.94/},
  pages     = {873--879},
  isbn      = {979-12-210-7060-6},
  abstract  = {In this paper, we present a multimodal model for classifying fake news. The main peculiarity of the proposed model is the \textit{cross attention} mechanism. Cross-attention is an evolution of the attention mechanism that allows the model to examine intermodal relationships to better understand information from different modalities, enabling it to simultaneously focus on the relevant parts of the data extracted from each. We tested the model using \textit{MULTI-Fake-DetectiVE} data from Evalita 2023. The presented model is particularly effective in both the tasks of classifying fake news and evaluating the intermodal relationship.},
}
Markdown (Informal)
[Multimodal Attention Is All You Need](https://aclanthology.org/2024.clicit-1.94/) (Saioni & Giannone, CLiC-it 2024)
ACL
- Marco Saioni and Cristina Giannone. 2024. Multimodal Attention Is All You Need. In Proceedings of the 10th Italian Conference on Computational Linguistics (CLiC-it 2024), pages 873–879, Pisa, Italy. CEUR Workshop Proceedings.