@inproceedings{raha-etal-2022-iiith,
title = "{IIITH} at {S}em{E}val-2022 Task 5: A comparative study of deep learning models for identifying misogynous memes",
author = "Raha, Tathagata and
Joshi, Sagar and
Varma, Vasudeva",
editor = "Emerson, Guy and
Schluter, Natalie and
Stanovsky, Gabriel and
Kumar, Ritesh and
Palmer, Alexis and
Schneider, Nathan and
Singh, Siddharth and
Ratan, Shyam",
booktitle = "Proceedings of the 16th International Workshop on Semantic Evaluation (SemEval-2022)",
month = jul,
year = "2022",
address = "Seattle, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2022.semeval-1.92/",
doi = "10.18653/v1/2022.semeval-1.92",
pages = "673--678",
abstract = "This paper provides a comparison of different deep learning methods for identifying misogynous memes for SemEval-2022 Task 5: Multimedia Automatic Misogyny Identification. In this task, we experiment with architectures in the identification of misogynous content in memes by making use of text and image-based information. The different deep learning methods compared in this paper are: (i) unimodal image or text models (ii) fusion of unimodal models (iii) multimodal transformers models and (iv) transformers further pretrained on a multimodal task. From our experiments, we found pretrained multimodal transformer architectures to strongly outperform the models involving the fusion of representation from both the modalities."
}
Markdown (Informal)
[IIITH at SemEval-2022 Task 5: A comparative study of deep learning models for identifying misogynous memes](https://preview.aclanthology.org/add-emnlp-2024-awards/2022.semeval-1.92/) (Raha et al., SemEval 2022)
ACL