@inproceedings{danielsson-muhlenbock-2000-small,
title = "Small but efficient: the misconception of high-frequency words in {S}candinavian translation",
author = {Danielsson, Pernilla and
M{\"u}hlenbock, Katarina},
editor = "White, John S.",
booktitle = "Proceedings of the Fourth Conference of the Association for Machine Translation in the Americas: Technical Papers",
month = oct # " 10-14",
year = "2000",
address = "Cuernavaca, Mexico",
publisher = "Springer",
url = "https://link.springer.com/chapter/10.1007/3-540-39965-8_16",
pages = "158--168",
abstract = "Machine translation has proved itself to be easier between languages that are closely related, such as German and English, while far apart languages, such as Chinese and English, encounter much more problems. The present study focuses upon Swedish and Norwegian; two languages so closely related that they would be referred to as dialects if it were not for the fact that they had a Royal house and an army connected to each of them. Despite their similarity though, some differences make the translation phase much less straight-forward than what could be expected. Taking the outset in sentence aligned parallel texts, this study aims at highlighting some of the differences, and to formalise the results. In order to do so, the texts have been aligned on smaller units, by a simple cognate alignment method. Not at all surprising, the longer words were easier to align, while shorter and often high-frequent words became a problem. Also when trying to align to a specific word sense in a dictionary, content words rendered better results. Therefore, we abandoned the use of single-word units, and searched for multi-word units whenever possible. This study reinforces the view that Machine Translation should rest upon methods based on multiword unit searches.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="danielsson-muhlenbock-2000-small">
<titleInfo>
<title>Small but efficient: the misconception of high-frequency words in Scandinavian translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Pernilla</namePart>
<namePart type="family">Danielsson</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Katarina</namePart>
<namePart type="family">Mühlenbock</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2000-10-10/2000-10-14</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Fourth Conference of the Association for Machine Translation in the Americas: Technical Papers</title>
</titleInfo>
<name type="personal">
<namePart type="given">John</namePart>
<namePart type="given">S</namePart>
<namePart type="family">White</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Springer</publisher>
<place>
<placeTerm type="text">Cuernavaca, Mexico</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Machine translation has proved itself to be easier between languages that are closely related, such as German and English, while far apart languages, such as Chinese and English, encounter much more problems. The present study focuses upon Swedish and Norwegian; two languages so closely related that they would be referred to as dialects if it were not for the fact that they had a Royal house and an army connected to each of them. Despite their similarity though, some differences make the translation phase much less straight-forward than what could be expected. Taking the outset in sentence aligned parallel texts, this study aims at highlighting some of the differences, and to formalise the results. In order to do so, the texts have been aligned on smaller units, by a simple cognate alignment method. Not at all surprising, the longer words were easier to align, while shorter and often high-frequent words became a problem. Also when trying to align to a specific word sense in a dictionary, content words rendered better results. Therefore, we abandoned the use of single-word units, and searched for multi-word units whenever possible. This study reinforces the view that Machine Translation should rest upon methods based on multiword unit searches.</abstract>
<identifier type="citekey">danielsson-muhlenbock-2000-small</identifier>
<location>
<url>https://link.springer.com/chapter/10.1007/3-540-39965-8_16</url>
</location>
<part>
<date>2000-10-10/2000-10-14</date>
<extent unit="page">
<start>158</start>
<end>168</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Small but efficient: the misconception of high-frequency words in Scandinavian translation
%A Danielsson, Pernilla
%A Mühlenbock, Katarina
%Y White, John S.
%S Proceedings of the Fourth Conference of the Association for Machine Translation in the Americas: Technical Papers
%D 2000
%8 October 10-14
%I Springer
%C Cuernavaca, Mexico
%F danielsson-muhlenbock-2000-small
%X Machine translation has proved itself to be easier between languages that are closely related, such as German and English, while far apart languages, such as Chinese and English, encounter much more problems. The present study focuses upon Swedish and Norwegian; two languages so closely related that they would be referred to as dialects if it were not for the fact that they had a Royal house and an army connected to each of them. Despite their similarity though, some differences make the translation phase much less straight-forward than what could be expected. Taking the outset in sentence aligned parallel texts, this study aims at highlighting some of the differences, and to formalise the results. In order to do so, the texts have been aligned on smaller units, by a simple cognate alignment method. Not at all surprising, the longer words were easier to align, while shorter and often high-frequent words became a problem. Also when trying to align to a specific word sense in a dictionary, content words rendered better results. Therefore, we abandoned the use of single-word units, and searched for multi-word units whenever possible. This study reinforces the view that Machine Translation should rest upon methods based on multiword unit searches.
%U https://link.springer.com/chapter/10.1007/3-540-39965-8_16
%P 158-168
Markdown (Informal)
[Small but efficient: the misconception of high-frequency words in Scandinavian translation](https://link.springer.com/chapter/10.1007/3-540-39965-8_16) (Danielsson & Mühlenbock, AMTA 2000)
ACL