@article{yin-etal-2016-abcnn,
title = "{ABCNN}: Attention-Based Convolutional Neural Network for Modeling Sentence Pairs",
author = {Yin, Wenpeng and
Sch{\"u}tze, Hinrich and
Xiang, Bing and
Zhou, Bowen},
editor = "Lee, Lillian and
Johnson, Mark and
Toutanova, Kristina",
journal = "Transactions of the Association for Computational Linguistics",
volume = "4",
year = "2016",
address = "Cambridge, MA",
publisher = "MIT Press",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/Q16-1019/",
doi = "10.1162/tacl_a_00097",
pages = "259--272",
abstract = "How to model a pair of sentences is a critical issue in many NLP tasks such as answer selection (AS), paraphrase identification (PI) and textual entailment (TE). Most prior work (i) deals with one individual task by fine-tuning a specific system; (ii) models each sentence`s representation separately, rarely considering the impact of the other sentence; or (iii) relies fully on manually designed, task-specific linguistic features. This work presents a general Attention Based Convolutional Neural Network (ABCNN) for modeling a pair of sentences. We make three contributions. (i) The ABCNN can be applied to a wide variety of tasks that require modeling of sentence pairs. (ii) We propose three attention schemes that integrate mutual influence between sentences into CNNs; thus, the representation of each sentence takes into consideration its counterpart. These interdependent sentence pair representations are more powerful than isolated sentence representations. (iii) ABCNNs achieve state-of-the-art performance on AS, PI and TE tasks. We release code at: \url{https://github.com/yinwenpeng/Answer_Selection}."
}
Markdown (Informal)
[ABCNN: Attention-Based Convolutional Neural Network for Modeling Sentence Pairs](https://preview.aclanthology.org/jlcl-multiple-ingestion/Q16-1019/) (Yin et al., TACL 2016)
ACL