% Mathur et al. (2018): ALW2 workshop paper presenting the MIMCT model and the HOT dataset.
% The url field is the canonical ACL Anthology address; the doi field resolves to the same paper.
% Braced words in the title keep their capitalisation under sentence-casing styles.
@inproceedings{mathur-etal-2018-offend,
  title     = {Did you offend me? {Classification} of Offensive Tweets in {Hinglish} Language},
  author    = {Mathur, Puneet and
               Sawhney, Ramit and
               Ayyar, Meghna and
               Shah, Rajiv},
  editor    = {Fi{\v{s}}er, Darja and
               Huang, Ruihong and
               Prabhakaran, Vinodkumar and
               Voigt, Rob and
               Waseem, Zeerak and
               Wernimont, Jacqueline},
  booktitle = {Proceedings of the 2nd Workshop on Abusive Language Online ({ALW}2)},
  month     = oct,
  year      = {2018},
  address   = {Brussels, Belgium},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/W18-5118/},
  doi       = {10.18653/v1/W18-5118},
  pages     = {138--148},
  abstract  = {The use of code-switched languages (e.g., Hinglish, which is derived by the blending of Hindi with the English language) is getting much popular on Twitter due to their ease of communication in native languages. However, spelling variations and absence of grammar rules introduce ambiguity and make it difficult to understand the text automatically. This paper presents the Multi-Input Multi-Channel Transfer Learning based model (MIMCT) to detect offensive (hate speech or abusive) Hinglish tweets from the proposed Hinglish Offensive Tweet (HOT) dataset using transfer learning coupled with multiple feature inputs. Specifically, it takes multiple primary word embedding along with secondary extracted features as inputs to train a multi-channel CNN-LSTM architecture that has been pre-trained on English tweets through transfer learning. The proposed MIMCT model outperforms the baseline supervised classification models, transfer learning based CNN and LSTM models to establish itself as the state of the art in the unexplored domain of Hinglish offensive text classification.},
}
Markdown (Informal)
[Did you offend me? Classification of Offensive Tweets in Hinglish Language](https://aclanthology.org/W18-5118/) (Mathur et al., ALW 2018)
ACL