@inproceedings{lin-etal-2004-extraction,
title = "Extraction of name and transliteration in monolingual and parallel corpora",
author = "Lin, Tracy and
Wu, Jian-Cheng and
Chang, Jason S.",
editor = "Frederking, Robert E. and
Taylor, Kathryn B.",
booktitle = "Proceedings of the 6th Conference of the Association for Machine Translation in the Americas: Technical Papers",
month = sep # " 28 - " # oct # " 2",
year = "2004",
address = "Washington, USA",
publisher = "Springer",
url = "https://link.springer.com/chapter/10.1007/978-3-540-30194-3_20",
pages = "177--186",
abstract = "Named-entities in free text represent a challenge to text analysis in Machine Translation and Cross Language Information Retrieval. These phrases are often transliterated into another language with a different sound inventory and writing system. Named-entities found in free text are often not listed in bilingual dictionaries. Although it is possible to identify and translate named-entities on the fly without a list of proper names and transliterations, an extensive list of existing transliterations certainly will ensure high precision rate. We use a seed list of proper names and transliterations to train a Machine Transliteration Model. With the model it is possible to extract proper names and their transliterations in monolingual or parallel corpora with high precision and recall rates.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="lin-etal-2004-extraction">
<titleInfo>
<title>Extraction of name and transliteration in monolingual and parallel corpora</title>
</titleInfo>
<name type="personal">
<namePart type="given">Tracy</namePart>
<namePart type="family">Lin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jian-Cheng</namePart>
<namePart type="family">Wu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jason</namePart>
<namePart type="given">S</namePart>
<namePart type="family">Chang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2004-sep 28 - oct 2</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 6th Conference of the Association for Machine Translation in the Americas: Technical Papers</title>
</titleInfo>
<name type="personal">
<namePart type="given">Robert</namePart>
<namePart type="given">E</namePart>
<namePart type="family">Frederking</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kathryn</namePart>
<namePart type="given">B</namePart>
<namePart type="family">Taylor</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Springer</publisher>
<place>
<placeTerm type="text">Washington, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Named-entities in free text represent a challenge to text analysis in Machine Translation and Cross Language Information Retrieval. These phrases are often transliterated into another language with a different sound inventory and writing system. Named-entities found in free text are often not listed in bilingual dictionaries. Although it is possible to identify and translate named-entities on the fly without a list of proper names and transliterations, an extensive list of existing transliterations certainly will ensure high precision rate. We use a seed list of proper names and transliterations to train a Machine Transliteration Model. With the model it is possible to extract proper names and their transliterations in monolingual or parallel corpora with high precision and recall rates.</abstract>
<identifier type="citekey">lin-etal-2004-extraction</identifier>
<location>
<url>https://link.springer.com/chapter/10.1007/978-3-540-30194-3_20</url>
</location>
<part>
<date>2004-sep 28 - oct 2</date>
<extent unit="page">
<start>177</start>
<end>186</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Extraction of name and transliteration in monolingual and parallel corpora
%A Lin, Tracy
%A Wu, Jian-Cheng
%A Chang, Jason S.
%Y Frederking, Robert E.
%Y Taylor, Kathryn B.
%S Proceedings of the 6th Conference of the Association for Machine Translation in the Americas: Technical Papers
%D 2004
%8 sep 28 oct 2
%I Springer
%C Washington, USA
%F lin-etal-2004-extraction
%X Named-entities in free text represent a challenge to text analysis in Machine Translation and Cross Language Information Retrieval. These phrases are often transliterated into another language with a different sound inventory and writing system. Named-entities found in free text are often not listed in bilingual dictionaries. Although it is possible to identify and translate named-entities on the fly without a list of proper names and transliterations, an extensive list of existing transliterations certainly will ensure high precision rate. We use a seed list of proper names and transliterations to train a Machine Transliteration Model. With the model it is possible to extract proper names and their transliterations in monolingual or parallel corpora with high precision and recall rates.
%U https://link.springer.com/chapter/10.1007/978-3-540-30194-3_20
%P 177-186
Markdown (Informal)
[Extraction of name and transliteration in monolingual and parallel corpora](https://link.springer.com/chapter/10.1007/978-3-540-30194-3_20) (Lin et al., AMTA 2004)
ACL