@inproceedings{mundt-etal-2012-learning,
title = "Learning to Automatically Post-Edit Dropped Words in {MT}",
author = "Mundt, Jacob and
Parton, Kristen and
McKeown, Kathleen",
editor = "O'Brien, Sharon and
Simard, Michel and
Specia, Lucia",
booktitle = "Workshop on Post-Editing Technology and Practice",
month = oct # " 28",
year = "2012",
address = "San Diego, California, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2012.amta-wptp.5",
abstract = "Automatic post-editors (APEs) can improve adequacy of MT output by detecting and reinserting dropped content words, but the location where these words are inserted is critical. In this paper, we describe a probabilistic approach for learning reinsertion rules for specific languages and MT systems, as well as a method for synthesizing training data from reference translations. We test the insertion logic on MT systems for Chinese to English and Arabic to English. Our adaptive APE is able to insert within 3 words of the best location 73{\%} of the time (32{\%} in the exact location) in Arabic-English MT output, and 67{\%} of the time in Chinese-English output (30{\%} in the exact location), and delivers improved performance on automated adequacy metrics over a previous rule-based approach to insertion. We consider how particular aspects of the insertion problem make it particularly amenable to machine learning solutions.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="mundt-etal-2012-learning">
<titleInfo>
<title>Learning to Automatically Post-Edit Dropped Words in MT</title>
</titleInfo>
<name type="personal">
<namePart type="given">Jacob</namePart>
<namePart type="family">Mundt</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kristen</namePart>
<namePart type="family">Parton</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kathleen</namePart>
<namePart type="family">McKeown</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2012-oct 28</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Workshop on Post-Editing Technology and Practice</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sharon</namePart>
<namePart type="family">O’Brien</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Michel</namePart>
<namePart type="family">Simard</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lucia</namePart>
<namePart type="family">Specia</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Automatic post-editors (APEs) can improve adequacy of MT output by detecting and reinserting dropped content words, but the location where these words are inserted is critical. In this paper, we describe a probabilistic approach for learning reinsertion rules for specific languages and MT systems, as well as a method for synthesizing training data from reference translations. We test the insertion logic on MT systems for Chinese to English and Arabic to English. Our adaptive APE is able to insert within 3 words of the best location 73% of the time (32% in the exact location) in Arabic-English MT output, and 67% of the time in Chinese-English output (30% in the exact location), and delivers improved performance on automated adequacy metrics over a previous rule-based approach to insertion. We consider how particular aspects of the insertion problem make it particularly amenable to machine learning solutions.</abstract>
<identifier type="citekey">mundt-etal-2012-learning</identifier>
<location>
<url>https://aclanthology.org/2012.amta-wptp.5</url>
</location>
<part>
<date>2012-oct 28</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Learning to Automatically Post-Edit Dropped Words in MT
%A Mundt, Jacob
%A Parton, Kristen
%A McKeown, Kathleen
%Y O’Brien, Sharon
%Y Simard, Michel
%Y Specia, Lucia
%S Workshop on Post-Editing Technology and Practice
%D 2012
%8 oct 28
%I Association for Machine Translation in the Americas
%C San Diego, California, USA
%F mundt-etal-2012-learning
%X Automatic post-editors (APEs) can improve adequacy of MT output by detecting and reinserting dropped content words, but the location where these words are inserted is critical. In this paper, we describe a probabilistic approach for learning reinsertion rules for specific languages and MT systems, as well as a method for synthesizing training data from reference translations. We test the insertion logic on MT systems for Chinese to English and Arabic to English. Our adaptive APE is able to insert within 3 words of the best location 73% of the time (32% in the exact location) in Arabic-English MT output, and 67% of the time in Chinese-English output (30% in the exact location), and delivers improved performance on automated adequacy metrics over a previous rule-based approach to insertion. We consider how particular aspects of the insertion problem make it particularly amenable to machine learning solutions.
%U https://aclanthology.org/2012.amta-wptp.5
Markdown (Informal)
[Learning to Automatically Post-Edit Dropped Words in MT](https://aclanthology.org/2012.amta-wptp.5) (Mundt et al., AMTA 2012)
ACL