@inproceedings{singh-2012-addressing,
title = "Addressing some Issues of Data Sparsity towards Improving {E}nglish- {M}anipuri {SMT} using Morphological Information",
author = "Singh, Thoudam Doren",
editor = "Okita, Tsuyoshi and
Sokolov, Artem and
Watanabe, Taro",
booktitle = "Workshop on Monolingual Machine Translation",
month = oct # " 28-" # nov # " 1",
year = "2012",
address = "San Diego, California, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2012.amta-monomt.6",
abstract = "The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="singh-2012-addressing">
<titleInfo>
<title>Addressing some Issues of Data Sparsity towards Improving English- Manipuri SMT using Morphological Information</title>
</titleInfo>
<name type="personal">
<namePart type="given">Thoudam</namePart>
<namePart type="given">Doren</namePart>
<namePart type="family">Singh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2012-oct 28-nov 1</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Workshop on Monolingual Machine Translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Tsuyoshi</namePart>
<namePart type="family">Okita</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Artem</namePart>
<namePart type="family">Sokolov</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Taro</namePart>
<namePart type="family">Watanabe</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.</abstract>
<identifier type="citekey">singh-2012-addressing</identifier>
<location>
<url>https://aclanthology.org/2012.amta-monomt.6</url>
</location>
<part>
<date>2012-oct 28-nov 1</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Addressing some Issues of Data Sparsity towards Improving English- Manipuri SMT using Morphological Information
%A Singh, Thoudam Doren
%Y Okita, Tsuyoshi
%Y Sokolov, Artem
%Y Watanabe, Taro
%S Workshop on Monolingual Machine Translation
%D 2012
%8 oct 28 nov 1
%I Association for Machine Translation in the Americas
%C San Diego, California, USA
%F singh-2012-addressing
%X The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.
%U https://aclanthology.org/2012.amta-monomt.6
Markdown (Informal)
[Addressing some Issues of Data Sparsity towards Improving English- Manipuri SMT using Morphological Information](https://aclanthology.org/2012.amta-monomt.6) (Singh, AMTA 2012)
ACL