% Conference paper record: Findings of ACL, EMNLP 2021 (pages 843--853).
% url is the canonical Anthology permalink for the ID that also appears in the doi.
% NOTE(review): address carries the conference location rather than the
% publisher's city; kept as exported -- confirm it suits the style in use.
% NOTE(review): the exported abstract had lost the model-name macro in three
% places; those spots now read "framework". Restore the name from the paper
% if the verbatim abstract is required.
@inproceedings{wang-etal-2021-knowledge-guided,
  title     = {Knowledge-Guided Paraphrase Identification},
  author    = {Wang, Haoyu and
               Ma, Fenglong and
               Wang, Yaqing and
               Gao, Jing},
  editor    = {Moens, Marie-Francine and
               Huang, Xuanjing and
               Specia, Lucia and
               Yih, Scott Wen-tau},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2021},
  month     = nov,
  year      = {2021},
  address   = {Punta Cana, Dominican Republic},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2021.findings-emnlp.72/},
  doi       = {10.18653/v1/2021.findings-emnlp.72},
  pages     = {843--853},
  abstract  = {Paraphrase identification (PI), a fundamental task in natural language processing, is to identify whether two sentences express the same or similar meaning, which is a binary classification problem. Recently, BERT-like pre-trained language models have been a popular choice for the frameworks of various PI models, but almost all existing methods consider general domain text. When these approaches are applied to a specific domain, existing models cannot make accurate predictions due to the lack of professional knowledge. In light of this challenge, we propose a novel framework which can leverage the external unstructured Wikipedia knowledge to accurately identify paraphrases. We propose to mine outline knowledge of concepts related to given sentences from Wikipedia via BM25 model. After retrieving related outline knowledge, the framework makes predictions based on both the semantic information of two sentences and the outline knowledge. Besides, we propose a gating mechanism to aggregate the semantic information-based prediction and the knowledge-based prediction. Extensive experiments are conducted on two public datasets: PARADE (a computer science domain dataset) and clinicalSTS2019 (a biomedical domain dataset). The results show that the proposed framework outperforms state-of-the-art methods.},
}
Markdown (Informal)
[Knowledge-Guided Paraphrase Identification](https://aclanthology.org/2021.findings-emnlp.72/) (Wang et al., Findings 2021)
ACL
- Haoyu Wang, Fenglong Ma, Yaqing Wang, and Jing Gao. 2021. Knowledge-Guided Paraphrase Identification. In Findings of the Association for Computational Linguistics: EMNLP 2021, pages 843–853, Punta Cana, Dominican Republic. Association for Computational Linguistics.