% Workshop paper, ACL Anthology record W17-5601 (see the url field below).
@inproceedings{park-etal-2017-building,
  author    = {Park, Jungyeul and
               Dugast, Lo{\"\i}c and
               Hong, Jeen-Pyo and
               Shin, Chang-Uk and
               Cha, Jeong-Won},
  title     = {Building a Better Bitext for Structurally Different Languages through Self-training},
  editor    = {Afli, Haithem and
               Liu, Chao-Hong},
  booktitle = {Proceedings of the First Workshop on Curation and Applications of Parallel and Comparable Corpora},
  month     = nov,
  year      = {2017},
  address   = {Taipei, Taiwan},
  publisher = {Asian Federation of Natural Language Processing},
  pages     = {1--10},
  url       = {https://aclanthology.org/W17-5601},
  abstract  = {We propose a novel method to bootstrap the construction of parallel corpora for new pairs of structurally different languages. We do so by combining the use of a pivot language and self-training. A pivot language enables the use of existing translation models to bootstrap the alignment and a self-training procedure enables to achieve better alignment, both at the document and sentence level. We also propose several evaluation methods for the resulting alignment.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 record for citekey park-etal-2017-building: authors, host proceedings (with editors), abstract, URL and page extent. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="park-etal-2017-building">
    <titleInfo>
      <title>Building a Better Bitext for Structurally Different Languages through Self-training</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Jungyeul</namePart>
      <namePart type="family">Park</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Loïc</namePart>
      <namePart type="family">Dugast</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jeen-Pyo</namePart>
      <namePart type="family">Hong</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Chang-Uk</namePart>
      <namePart type="family">Shin</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jeong-Won</namePart>
      <namePart type="family">Cha</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2017-11</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume this paper appears in. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the First Workshop on Curation and Applications of Parallel and Comparable Corpora</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Haithem</namePart>
        <namePart type="family">Afli</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Chao-Hong</namePart>
        <namePart type="family">Liu</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Asian Federation of Natural Language Processing</publisher>
        <place>
          <placeTerm type="text">Taipei, Taiwan</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>We propose a novel method to bootstrap the construction of parallel corpora for new pairs of structurally different languages. We do so by combining the use of a pivot language and self-training. A pivot language enables the use of existing translation models to bootstrap the alignment and a self-training procedure enables to achieve better alignment, both at the document and sentence level. We also propose several evaluation methods for the resulting alignment.</abstract>
    <identifier type="citekey">park-etal-2017-building</identifier>
    <location>
      <url>https://aclanthology.org/W17-5601</url>
    </location>
    <part>
      <date>2017-11</date>
      <extent unit="page">
        <start>1</start>
        <end>10</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Building a Better Bitext for Structurally Different Languages through Self-training
%A Park, Jungyeul
%A Dugast, Loïc
%A Hong, Jeen-Pyo
%A Shin, Chang-Uk
%A Cha, Jeong-Won
%Y Afli, Haithem
%Y Liu, Chao-Hong
%S Proceedings of the First Workshop on Curation and Applications of Parallel and Comparable Corpora
%D 2017
%8 November
%I Asian Federation of Natural Language Processing
%C Taipei, Taiwan
%F park-etal-2017-building
%X We propose a novel method to bootstrap the construction of parallel corpora for new pairs of structurally different languages. We do so by combining the use of a pivot language and self-training. A pivot language enables the use of existing translation models to bootstrap the alignment and a self-training procedure enables to achieve better alignment, both at the document and sentence level. We also propose several evaluation methods for the resulting alignment.
%U https://aclanthology.org/W17-5601
%P 1-10
Markdown (Informal)
[Building a Better Bitext for Structurally Different Languages through Self-training](https://aclanthology.org/W17-5601) (Park et al., 2017)
ACL