% W-NUT 2020 workshop paper on entailment detection in code-mixed Hindi-English conversations.
% The url field uses the canonical ACL Anthology address, not a temporary preview-branch link.
@inproceedings{chakravarthy-etal-2020-detecting,
  title     = {Detecting Entailment in Code-Mixed {Hindi}-{English} Conversations},
  author    = {Chakravarthy, Sharanya and
               Umapathy, Anjana and
               Black, Alan W},
  editor    = {Xu, Wei and
               Ritter, Alan and
               Baldwin, Tim and
               Rahimi, Afshin},
  booktitle = {Proceedings of the Sixth Workshop on Noisy User-generated Text (W-NUT 2020)},
  month     = nov,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2020.wnut-1.22/},
  doi       = {10.18653/v1/2020.wnut-1.22},
  pages     = {165--170},
  abstract  = {The presence of large-scale corpora for Natural Language Inference (NLI) has spurred deep learning research in this area, though much of this research has focused solely on monolingual data. Code-mixing is the intertwined usage of multiple languages, and is commonly seen in informal conversations among polyglots. Given the rising importance of dialogue agents, it is imperative that they understand code-mixing, but the scarcity of code-mixed Natural Language Understanding (NLU) datasets has precluded research in this area. The dataset by Khanuja et al. for detecting conversational entailment in code-mixed Hindi-English text is the first of its kind. We investigate the effectiveness of language modeling, data augmentation, translation, and architectural approaches to address the code-mixed, conversational, and low-resource aspects of this dataset. We obtain an 8.09{\%} increase in test set accuracy over the current state of the art.},
}
Markdown (Informal)
[Detecting Entailment in Code-Mixed Hindi-English Conversations](https://aclanthology.org/2020.wnut-1.22/) (Chakravarthy et al., WNUT 2020)
ACL