@inproceedings{pimpalkhute-etal-2021-iiitn,
title = "{IIITN} {NLP} at {SMM}4{H} 2021 Tasks: Transformer Models for Classification on Health-Related Imbalanced {T}witter Datasets",
author = "Pimpalkhute, Varad and
Nakhate, Prajwal and
Diwan, Tausif",
editor = "Magge, Arjun and
Klein, Ari and
Miranda-Escalada, Antonio and
Al-garadi, Mohammed Ali and
Alimova, Ilseyar and
Miftahutdinov, Zulfat and
Farre-Maduell, Eulalia and
Lopez, Salvador Lima and
Flores, Ivan and
O'Connor, Karen and
Weissenbacher, Davy and
Tutubalina, Elena and
Sarker, Abeed and
Banda, Juan M and
Krallinger, Martin and
Gonzalez-Hernandez, Graciela",
booktitle = "Proceedings of the Sixth Social Media Mining for Health ({\#}SMM4H) Workshop and Shared Task",
month = jun,
year = "2021",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2021.smm4h-1.24/",
doi = "10.18653/v1/2021.smm4h-1.24",
pages = "118--122",
abstract = "With increasing users sharing health-related information on social media, there has been a rise in using social media for health monitoring and surveillance. In this paper, we present a system that addresses classic health-related binary classification problems presented in Tasks 1a, 4, and 8 of the 6th edition of Social Media Mining for Health Applications (SMM4H) shared tasks. We developed a system based on RoBERTa (for Task 1a {\&} 4) and BioBERT (for Task 8). Furthermore, we address the challenge of the imbalanced dataset and propose techniques such as undersampling, oversampling, and data augmentation to overcome the imbalanced nature of a given health-related dataset."
}
Markdown (Informal)
[IIITN NLP at SMM4H 2021 Tasks: Transformer Models for Classification on Health-Related Imbalanced Twitter Datasets](https://preview.aclanthology.org/fix-sig-urls/2021.smm4h-1.24/) (Pimpalkhute et al., SMM4H 2021)
ACL