@inproceedings{reeder-2006-direct,
title = "Direct Application of a Language Learner Test to {MT} Evaluation",
author = "Reeder, Florence",
booktitle = "Proceedings of the 7th Conference of the Association for Machine Translation in the Americas: Technical Papers",
month = aug # " 8-12",
year = "2006",
address = "Cambridge, Massachusetts, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2006.amta-papers.19",
pages = "166--175",
abstract = "This paper shows the applicability of language testing techniques to machine translation (MT) evaluation through one of a set of related experiments. One straightforward experiment is to use language testing exams and scoring on MT output with little or no adaptation. This paper describes one such experiment, the first in a set. After an initial test (Vanni and Reeder, 2000), we expanded the experiment to include multiple raters and a more detailed analysis of the surprising results. Namely that unlike with humans, MT systems perform more poorly at both level zero and one than at level two and three. This paper presents these results as an illustration of both the applicability of language testing techniques and also the caution that needs to be applied.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="reeder-2006-direct">
<titleInfo>
<title>Direct Application of a Language Learner Test to MT Evaluation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Florence</namePart>
<namePart type="family">Reeder</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2006-aug 8-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 7th Conference of the Association for Machine Translation in the Americas: Technical Papers</title>
</titleInfo>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">Cambridge, Massachusetts, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper shows the applicability of language testing techniques to machine translation (MT) evaluation through one of a set of related experiments. One straightforward experiment is to use language testing exams and scoring on MT output with little or no adaptation. This paper describes one such experiment, the first in a set. After an initial test (Vanni and Reeder, 2000), we expanded the experiment to include multiple raters and a more detailed analysis of the surprising results. Namely that unlike with humans, MT systems perform more poorly at both level zero and one than at level two and three. This paper presents these results as an illustration of both the applicability of language testing techniques and also the caution that needs to be applied.</abstract>
<identifier type="citekey">reeder-2006-direct</identifier>
<location>
<url>https://aclanthology.org/2006.amta-papers.19</url>
</location>
<part>
<date>2006-aug 8-12</date>
<extent unit="page">
<start>166</start>
<end>175</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Direct Application of a Language Learner Test to MT Evaluation
%A Reeder, Florence
%S Proceedings of the 7th Conference of the Association for Machine Translation in the Americas: Technical Papers
%D 2006
%8 aug 8 12
%I Association for Machine Translation in the Americas
%C Cambridge, Massachusetts, USA
%F reeder-2006-direct
%X This paper shows the applicability of language testing techniques to machine translation (MT) evaluation through one of a set of related experiments. One straightforward experiment is to use language testing exams and scoring on MT output with little or no adaptation. This paper describes one such experiment, the first in a set. After an initial test (Vanni and Reeder, 2000), we expanded the experiment to include multiple raters and a more detailed analysis of the surprising results. Namely that unlike with humans, MT systems perform more poorly at both level zero and one than at level two and three. This paper presents these results as an illustration of both the applicability of language testing techniques and also the caution that needs to be applied.
%U https://aclanthology.org/2006.amta-papers.19
%P 166-175
Markdown (Informal)
[Direct Application of a Language Learner Test to MT Evaluation](https://aclanthology.org/2006.amta-papers.19) (Reeder, AMTA 2006)
ACL