@inproceedings{chen-etal-2016-guided,
title = "Guided Alignment Training for Topic-Aware Neural Machine Translation",
author = "Chen, Wenhu and
Matusov, Evgeny and
Khadivi, Shahram and
Peter, Jan-Thorsten",
editor = "Green, Spence and
Schwartz, Lane",
booktitle = "Conferences of the Association for Machine Translation in the Americas: MT Researchers' Track",
month = oct # " 28 - " # nov # " 1",
year = "2016",
address = "Austin, TX, USA",
publisher = "The Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2016.amta-researchers.10",
pages = "121--134",
abstract = "In this paper, we propose an effective way for biasing the attention mechanism of a sequence-to-sequence neural machine translation (NMT) model towards the well-studied statistical word alignment models. We show that our novel guided alignment training approach improves translation quality on real-life e-commerce texts consisting of product titles and descriptions, overcoming the problems posed by many unknown words and a large type/token ratio. We also show that meta-data associated with input texts such as topic or category information can significantly improve translation quality when used as an additional signal to the decoder part of the network. With both novel features, the BLEU score of the NMT system on a product title set improves from 18.6 to 21.3{\%}. Even larger MT quality gains are obtained through domain adaptation of a general domain NMT system to e-commerce data. The developed NMT system also performs well on the IWSLT speech translation task, where an ensemble of four variant systems outperforms the phrase-based baseline by 2.1{\%} BLEU absolute.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="chen-etal-2016-guided">
<titleInfo>
<title>Guided Alignment Training for Topic-Aware Neural Machine Translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Wenhu</namePart>
<namePart type="family">Chen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Evgeny</namePart>
<namePart type="family">Matusov</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Shahram</namePart>
<namePart type="family">Khadivi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jan-Thorsten</namePart>
<namePart type="family">Peter</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2016-10-28/2016-11-01</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Conferences of the Association for Machine Translation in the Americas: MT Researchers’ Track</title>
</titleInfo>
<name type="personal">
<namePart type="given">Spence</namePart>
<namePart type="family">Green</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lane</namePart>
<namePart type="family">Schwartz</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>The Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">Austin, TX, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we propose an effective way for biasing the attention mechanism of a sequence-to-sequence neural machine translation (NMT) model towards the well-studied statistical word alignment models. We show that our novel guided alignment training approach improves translation quality on real-life e-commerce texts consisting of product titles and descriptions, overcoming the problems posed by many unknown words and a large type/token ratio. We also show that meta-data associated with input texts such as topic or category information can significantly improve translation quality when used as an additional signal to the decoder part of the network. With both novel features, the BLEU score of the NMT system on a product title set improves from 18.6 to 21.3%. Even larger MT quality gains are obtained through domain adaptation of a general domain NMT system to e-commerce data. The developed NMT system also performs well on the IWSLT speech translation task, where an ensemble of four variant systems outperforms the phrase-based baseline by 2.1% BLEU absolute.</abstract>
<identifier type="citekey">chen-etal-2016-guided</identifier>
<location>
<url>https://aclanthology.org/2016.amta-researchers.10</url>
</location>
<part>
<date>2016-10-28/2016-11-01</date>
<extent unit="page">
<start>121</start>
<end>134</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Guided Alignment Training for Topic-Aware Neural Machine Translation
%A Chen, Wenhu
%A Matusov, Evgeny
%A Khadivi, Shahram
%A Peter, Jan-Thorsten
%Y Green, Spence
%Y Schwartz, Lane
%S Conferences of the Association for Machine Translation in the Americas: MT Researchers’ Track
%D 2016
%8 oct 28 - nov 1
%I The Association for Machine Translation in the Americas
%C Austin, TX, USA
%F chen-etal-2016-guided
%X In this paper, we propose an effective way for biasing the attention mechanism of a sequence-to-sequence neural machine translation (NMT) model towards the well-studied statistical word alignment models. We show that our novel guided alignment training approach improves translation quality on real-life e-commerce texts consisting of product titles and descriptions, overcoming the problems posed by many unknown words and a large type/token ratio. We also show that meta-data associated with input texts such as topic or category information can significantly improve translation quality when used as an additional signal to the decoder part of the network. With both novel features, the BLEU score of the NMT system on a product title set improves from 18.6 to 21.3%. Even larger MT quality gains are obtained through domain adaptation of a general domain NMT system to e-commerce data. The developed NMT system also performs well on the IWSLT speech translation task, where an ensemble of four variant systems outperforms the phrase-based baseline by 2.1% BLEU absolute.
%U https://aclanthology.org/2016.amta-researchers.10
%P 121-134
Markdown (Informal)
[Guided Alignment Training for Topic-Aware Neural Machine Translation](https://aclanthology.org/2016.amta-researchers.10) (Chen et al., AMTA 2016)
ACL