@inproceedings{kutsumi-etal-2005-selection,
title = "Selection of Entries for a Bilingual Dictionary from Aligned Translation Equivalents using Support Vector Machines",
author = "Kutsumi, Takeshi and
Yoshimi, Takehiko and
Kotani, Katsunori and
Sata, Ichiko and
Isahara, Hitoshi",
booktitle = "Proceedings of Machine Translation Summit X: Papers",
month = sep # " 13-15",
year = "2005",
address = "Phuket, Thailand",
url = "https://aclanthology.org/2005.mtsummit-papers.2/",
pages = "11--16",
abstract = "This paper claims that constructing a dictionary using bilingual pairs obtained from parallel corpora needs not only correct alignment of two noun phrases but also judgment of its appropriateness as an entry. It specifically addresses the latter task, which has been paid little attention. It demonstrates a method of selecting a suitable entry using Support Vector Machines, and proposes to regard as the features the common and the different parts between a current translation and a new translation. Using experiment results, this paper examines how selection performances are affected by the four ways of representing the common and the different parts: morphemes, parts of speech, semantic markers, and upper-level semantic markers. Moreover, we used n-grams of the common and the different parts of above four kinds of features. Experimental result found that representation by morphemes marked the best performance, F-measure of 0.803."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="kutsumi-etal-2005-selection">
<titleInfo>
<title>Selection of Entries for a Bilingual Dictionary from Aligned Translation Equivalents using Support Vector Machines</title>
</titleInfo>
<name type="personal">
<namePart type="given">Takeshi</namePart>
<namePart type="family">Kutsumi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Takehiko</namePart>
<namePart type="family">Yoshimi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Katsunori</namePart>
<namePart type="family">Kotani</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ichiko</namePart>
<namePart type="family">Sata</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hitoshi</namePart>
<namePart type="family">Isahara</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2005-09-13/2005-09-15</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of Machine Translation Summit X: Papers</title>
</titleInfo>
<originInfo>
<place>
<placeTerm type="text">Phuket, Thailand</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper claims that constructing a dictionary using bilingual pairs obtained from parallel corpora needs not only correct alignment of two noun phrases but also judgment of its appropriateness as an entry. It specifically addresses the latter task, which has been paid little attention. It demonstrates a method of selecting a suitable entry using Support Vector Machines, and proposes to regard as the features the common and the different parts between a current translation and a new translation. Using experiment results, this paper examines how selection performances are affected by the four ways of representing the common and the different parts: morphemes, parts of speech, semantic markers, and upper-level semantic markers. Moreover, we used n-grams of the common and the different parts of above four kinds of features. Experimental result found that representation by morphemes marked the best performance, F-measure of 0.803.</abstract>
<identifier type="citekey">kutsumi-etal-2005-selection</identifier>
<location>
<url>https://aclanthology.org/2005.mtsummit-papers.2/</url>
</location>
<part>
<date>2005-09-13/2005-09-15</date>
<extent unit="page">
<start>11</start>
<end>16</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Selection of Entries for a Bilingual Dictionary from Aligned Translation Equivalents using Support Vector Machines
%A Kutsumi, Takeshi
%A Yoshimi, Takehiko
%A Kotani, Katsunori
%A Sata, Ichiko
%A Isahara, Hitoshi
%S Proceedings of Machine Translation Summit X: Papers
%D 2005
%8 September 13-15
%C Phuket, Thailand
%F kutsumi-etal-2005-selection
%X This paper claims that constructing a dictionary using bilingual pairs obtained from parallel corpora needs not only correct alignment of two noun phrases but also judgment of its appropriateness as an entry. It specifically addresses the latter task, which has been paid little attention. It demonstrates a method of selecting a suitable entry using Support Vector Machines, and proposes to regard as the features the common and the different parts between a current translation and a new translation. Using experiment results, this paper examines how selection performances are affected by the four ways of representing the common and the different parts: morphemes, parts of speech, semantic markers, and upper-level semantic markers. Moreover, we used n-grams of the common and the different parts of above four kinds of features. Experimental result found that representation by morphemes marked the best performance, F-measure of 0.803.
%U https://aclanthology.org/2005.mtsummit-papers.2/
%P 11-16
Markdown (Informal)
[Selection of Entries for a Bilingual Dictionary from Aligned Translation Equivalents using Support Vector Machines](https://aclanthology.org/2005.mtsummit-papers.2/) (Kutsumi et al., MTSummit 2005)
ACL