@article{TACL831,
	author = {Yin, Wenpeng  and Schütze, Hinrich  and Xiang, Bing  and Zhou, Bowen },
	title = {ABCNN: Attention-Based Convolutional Neural Network for Modeling Sentence Pairs},
	journal = {Transactions of the Association for Computational Linguistics},
	volume = {4},
	year = {2016},
	keywords = {},
	abstract = {How to model a pair of sentences is a critical issue in manyNLP tasks such as answer selection (AS), paraphrase identification (PI) and textual entailment (TE). Most prior work (i) deals with one individual task by fine-tuning a specific system; (ii) models each sentence's representation separately, rarely considering the impact of the other sentence; or (iii) relies fully on manually designed, task-specific linguistic features. This work presents a general Attention Based Convolutional Neural Network (ABCNN) for modeling a pair of sentences. We make three contributions. (i) The ABCNN can be applied to a wide variety of tasks that require modeling of sentence pairs. (ii) We propose three attention schemes that integrate mutual influence between sentences into CNNs; thus, the representation of eachsentence takes into consideration its counterpart. Theseinterdependent sentence pair representations are morepowerful than isolated sentence representations. (iii)ABCNNs achieve state-of-the-art performance on AS, PI and TE tasks. We release code at: https://github.com/yinwenpeng/Answer_Selection.},
	issn = {2307-387X},
	url = {https://tacl2013.cs.columbia.edu/ojs/index.php/tacl/article/view/831},
	pages = {259--272}
}
