% Workshop paper (IWSLT 2008); the url field points at the ACL Anthology record.
% The title carries no trailing period: terminal punctuation is supplied by the
% bibliography style. The day range in month uses "--" like the pages range.
% NOTE(review): "Scott Appling" is stored as a compound family name; confirm
% against the paper whether "Scott" belongs with the given names instead.
@inproceedings{bond-etal-2008-improving,
    title = "Improving statistical machine translation by paraphrasing the training data",
    author = "Bond, Francis and
      Nichols, Eric and
      Scott Appling, Darren and
      Paul, Michael",
    booktitle = "Proceedings of the 5th International Workshop on Spoken Language Translation: Papers",
    month = oct # " 20--21",
    year = "2008",
    address = "Waikiki, Hawaii",
    url = "https://aclanthology.org/2008.iwslt-papers.2",
    pages = "150--157",
    abstract = "Large amounts of training data are essential for training statistical machine translations systems. In this paper we show how training data can be expanded by paraphrasing one side. The new data is made by parsing then generating using a precise HPSG based grammar, which gives sentences with the same meaning, but minor variations in lexical choice and word order. In experiments with Japanese and English, we showed consistent gains on the Tanaka Corpus with less consistent improvement on the IWSLT 2005 evaluation data.",
}
<?xml version="1.0" encoding="UTF-8"?>
<!--
  MODS record for the conference paper with citekey bond-etal-2008-improving.
  The issue date and the part date are expressed as W3CDTF start/end points
  covering the two-day range 20 to 21 October 2008, so that date-aware
  consumers can parse them.
-->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="bond-etal-2008-improving">
    <titleInfo>
      <title>Improving statistical machine translation by paraphrasing the training data.</title>
    </titleInfo>
    <!-- Authors, in the order they are listed for the paper. -->
    <name type="personal">
      <namePart type="given">Francis</namePart>
      <namePart type="family">Bond</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Eric</namePart>
      <namePart type="family">Nichols</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <!-- NOTE(review): compound family name as recorded; confirm the given/family split against the paper. -->
    <name type="personal">
      <namePart type="given">Darren</namePart>
      <namePart type="family">Scott Appling</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Michael</namePart>
      <namePart type="family">Paul</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued encoding="w3cdtf" point="start">2008-10-20</dateIssued>
      <dateIssued encoding="w3cdtf" point="end">2008-10-21</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume this paper appears in. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 5th International Workshop on Spoken Language Translation: Papers</title>
      </titleInfo>
      <originInfo>
        <place>
          <placeTerm type="text">Waikiki, Hawaii</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>Large amounts of training data are essential for training statistical machine translations systems. In this paper we show how training data can be expanded by paraphrasing one side. The new data is made by parsing then generating using a precise HPSG based grammar, which gives sentences with the same meaning, but minor variations in lexical choice and word order. In experiments with Japanese and English, we showed consistent gains on the Tanaka Corpus with less consistent improvement on the IWSLT 2005 evaluation data.</abstract>
    <identifier type="citekey">bond-etal-2008-improving</identifier>
    <location>
      <url>https://aclanthology.org/2008.iwslt-papers.2</url>
    </location>
    <part>
      <date encoding="w3cdtf" point="start">2008-10-20</date>
      <date encoding="w3cdtf" point="end">2008-10-21</date>
      <extent unit="page">
        <start>150</start>
        <end>157</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Improving statistical machine translation by paraphrasing the training data.
%A Bond, Francis
%A Nichols, Eric
%A Scott Appling, Darren
%A Paul, Michael
%S Proceedings of the 5th International Workshop on Spoken Language Translation: Papers
%D 2008
%8 oct 20-21
%C Waikiki, Hawaii
%F bond-etal-2008-improving
%X Large amounts of training data are essential for training statistical machine translations systems. In this paper we show how training data can be expanded by paraphrasing one side. The new data is made by parsing then generating using a precise HPSG based grammar, which gives sentences with the same meaning, but minor variations in lexical choice and word order. In experiments with Japanese and English, we showed consistent gains on the Tanaka Corpus with less consistent improvement on the IWSLT 2005 evaluation data.
%U https://aclanthology.org/2008.iwslt-papers.2
%P 150-157
Markdown (Informal)
[Improving statistical machine translation by paraphrasing the training data.](https://aclanthology.org/2008.iwslt-papers.2) (Bond et al., IWSLT 2008)
ACL