@inproceedings{ma-etal-2008-exploiting,
title = "Exploiting alignment techniques in {MATREX}: the {DCU} machine translation system for {IWSLT} 2008.",
author = "Ma, Yanjun and
Tinsley, John and
Hassan, Hany and
Du, Jinhua and
Way, Andy",
booktitle = "Proceedings of the 5th International Workshop on Spoken Language Translation: Evaluation Campaign",
month = oct # " 20-21",
year = "2008",
address = "Waikiki, Hawaii",
url = "https://aclanthology.org/2008.iwslt-evaluation.3",
pages = "26--33",
abstract = "In this paper, we give a description of the machine translation (MT) system developed at DCU that was used for our third participation in the evaluation campaign of the International Workshop on Spoken Language Translation (IWSLT 2008). In this participation, we focus on various techniques for word and phrase alignment to improve system quality. Specifically, we try out our word packing and syntax-enhanced word alignment techniques for the Chinese{--}English task and for the English{--}Chinese task for the first time. For all translation tasks except Arabic{--}English, we exploit linguistically motivated bilingual phrase pairs extracted from parallel treebanks. We smooth our translation tables with out-of-domain word translations for the Arabic{--}English and Chinese{--}English tasks in order to solve the problem of the high number of out of vocabulary items. We also carried out experiments combining both in-domain and out-of-domain data to improve system performance and, finally, we deploy a majority voting procedure combining a language model-based method and a translation-based method for case and punctuation restoration. We participated in all the translation tasks and translated both the single-best ASR hypotheses and the correct recognition results. The translation results confirm that our new word and phrase alignment techniques are often helpful in improving translation quality, and the data combination method we proposed can significantly improve system performance.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="ma-etal-2008-exploiting">
<titleInfo>
<title>Exploiting alignment techniques in MATREX: the DCU machine translation system for IWSLT 2008.</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yanjun</namePart>
<namePart type="family">Ma</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">John</namePart>
<namePart type="family">Tinsley</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hany</namePart>
<namePart type="family">Hassan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jinhua</namePart>
<namePart type="family">Du</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Andy</namePart>
<namePart type="family">Way</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2008-oct 20-21</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 5th International Workshop on Spoken Language Translation: Evaluation Campaign</title>
</titleInfo>
<originInfo>
<place>
<placeTerm type="text">Waikiki, Hawaii</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we give a description of the machine translation (MT) system developed at DCU that was used for our third participation in the evaluation campaign of the International Workshop on Spoken Language Translation (IWSLT 2008). In this participation, we focus on various techniques for word and phrase alignment to improve system quality. Specifically, we try out our word packing and syntax-enhanced word alignment techniques for the Chinese–English task and for the English–Chinese task for the first time. For all translation tasks except Arabic–English, we exploit linguistically motivated bilingual phrase pairs extracted from parallel treebanks. We smooth our translation tables with out-of-domain word translations for the Arabic–English and Chinese–English tasks in order to solve the problem of the high number of out of vocabulary items. We also carried out experiments combining both in-domain and out-of-domain data to improve system performance and, finally, we deploy a majority voting procedure combining a language model-based method and a translation-based method for case and punctuation restoration. We participated in all the translation tasks and translated both the single-best ASR hypotheses and the correct recognition results. The translation results confirm that our new word and phrase alignment techniques are often helpful in improving translation quality, and the data combination method we proposed can significantly improve system performance.</abstract>
<identifier type="citekey">ma-etal-2008-exploiting</identifier>
<location>
<url>https://aclanthology.org/2008.iwslt-evaluation.3</url>
</location>
<part>
<date>2008-oct 20-21</date>
<extent unit="page">
<start>26</start>
<end>33</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Exploiting alignment techniques in MATREX: the DCU machine translation system for IWSLT 2008.
%A Ma, Yanjun
%A Tinsley, John
%A Hassan, Hany
%A Du, Jinhua
%A Way, Andy
%S Proceedings of the 5th International Workshop on Spoken Language Translation: Evaluation Campaign
%D 2008
%8 oct 20 21
%C Waikiki, Hawaii
%F ma-etal-2008-exploiting
%X In this paper, we give a description of the machine translation (MT) system developed at DCU that was used for our third participation in the evaluation campaign of the International Workshop on Spoken Language Translation (IWSLT 2008). In this participation, we focus on various techniques for word and phrase alignment to improve system quality. Specifically, we try out our word packing and syntax-enhanced word alignment techniques for the Chinese–English task and for the English–Chinese task for the first time. For all translation tasks except Arabic–English, we exploit linguistically motivated bilingual phrase pairs extracted from parallel treebanks. We smooth our translation tables with out-of-domain word translations for the Arabic–English and Chinese–English tasks in order to solve the problem of the high number of out of vocabulary items. We also carried out experiments combining both in-domain and out-of-domain data to improve system performance and, finally, we deploy a majority voting procedure combining a language model-based method and a translation-based method for case and punctuation restoration. We participated in all the translation tasks and translated both the single-best ASR hypotheses and the correct recognition results. The translation results confirm that our new word and phrase alignment techniques are often helpful in improving translation quality, and the data combination method we proposed can significantly improve system performance.
%U https://aclanthology.org/2008.iwslt-evaluation.3
%P 26-33
Markdown (Informal)
[Exploiting alignment techniques in MATREX: the DCU machine translation system for IWSLT 2008.](https://aclanthology.org/2008.iwslt-evaluation.3) (Ma et al., IWSLT 2008)
ACL