% Findings of EMNLP 2023 paper, ACL Anthology ID 2023.findings-emnlp.457.
% The url field is the canonical Anthology landing page (not a preview-branch build); doi is the persistent identifier.
@inproceedings{bian-etal-2023-contrastive,
  title     = {Contrastive Distant Supervision for Debiased and Denoised Machine Reading Comprehension},
  author    = {Bian, Ning and
               Lin, Hongyu and
               Han, Xianpei and
               He, Ben and
               Sun, Le},
  editor    = {Bouamor, Houda and
               Pino, Juan and
               Bali, Kalika},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2023},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.findings-emnlp.457/},
  doi       = {10.18653/v1/2023.findings-emnlp.457},
  pages     = {6852--6863},
  abstract  = {Distant Supervision (DS) is a promising learning approach for MRC by leveraging easily-obtained question-answer pairs. Unfortunately, the heuristically annotated dataset will inevitably lead to mislabeled instances, resulting in answer bias and context noise problems. To learn debiased and denoised MRC models, this paper proposes the Contrastive Distant Supervision algorithm {--} CDS, which can learn to distinguish confusing and noisy instances via confidence-aware contrastive learning. Specifically, to eliminate answer bias, CDS samples counterfactual negative instances, which ensures that MRC models must take both answer information and question-context interaction into consideration. To denoise distantly annotated contexts, CDS samples confusing negative instances to increase the margin between correct and mislabeled instances. We further propose a confidence-aware contrastive loss to model and leverage the uncertainty of all DS instances during learning. Experimental results show that CDS is effective and can even outperform supervised MRC models without manual annotations.},
}
Markdown (Informal)
[Contrastive Distant Supervision for Debiased and Denoised Machine Reading Comprehension](https://aclanthology.org/2023.findings-emnlp.457/) (Bian et al., Findings 2023)
ACL