@inproceedings{bailey-2010-data,
title = "Data Preparation for Machine Translation Customization",
author = "Bailey, Stacey",
booktitle = "Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program",
month = oct # " 31-" # nov # " 4",
year = "2010",
address = "Denver, Colorado, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2010.amta-government.14",
abstract = "The presentation will focus on ongoing work to develop sentence-aligned Chinese-English data for machine translation customization. Fully automatic alignment produces noisy data (e.g., containing OCR and alignment errors), and we are looking at the question of just how noisy noisy data can be and still produce translation improvements. Related, data clean-up efforts are time- and labor-intensive and we are examining whether translation improvements justify the clean-up costs.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="bailey-2010-data">
<titleInfo>
<title>Data Preparation for Machine Translation Customization</title>
</titleInfo>
<name type="personal">
<namePart type="given">Stacey</namePart>
<namePart type="family">Bailey</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued encoding="w3cdtf" point="start">2010-10-31</dateIssued>
<dateIssued encoding="w3cdtf" point="end">2010-11-04</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program</title>
</titleInfo>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">Denver, Colorado, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>The presentation will focus on ongoing work to develop sentence-aligned Chinese-English data for machine translation customization. Fully automatic alignment produces noisy data (e.g., containing OCR and alignment errors), and we are looking at the question of just how noisy noisy data can be and still produce translation improvements. Related, data clean-up efforts are time- and labor-intensive and we are examining whether translation improvements justify the clean-up costs.</abstract>
<identifier type="citekey">bailey-2010-data</identifier>
<location>
<url>https://aclanthology.org/2010.amta-government.14</url>
</location>
<part>
<date encoding="w3cdtf" point="start">2010-10-31</date>
<date encoding="w3cdtf" point="end">2010-11-04</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Data Preparation for Machine Translation Customization
%A Bailey, Stacey
%S Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program
%D 2010
%8 October 31-November 4
%I Association for Machine Translation in the Americas
%C Denver, Colorado, USA
%F bailey-2010-data
%X The presentation will focus on ongoing work to develop sentence-aligned Chinese-English data for machine translation customization. Fully automatic alignment produces noisy data (e.g., containing OCR and alignment errors), and we are looking at the question of just how noisy noisy data can be and still produce translation improvements. Related, data clean-up efforts are time- and labor-intensive and we are examining whether translation improvements justify the clean-up costs.
%U https://aclanthology.org/2010.amta-government.14
Markdown (Informal)
[Data Preparation for Machine Translation Customization](https://aclanthology.org/2010.amta-government.14) (Bailey, AMTA 2010)
ACL
- Stacey Bailey. 2010. Data Preparation for Machine Translation Customization. In Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program, Denver, Colorado, USA. Association for Machine Translation in the Americas.