@inproceedings{jon-bojar-2024-analysis,
title = "An Analysis of Surprisal Uniformity in Machine and Human Translations",
author = "Jon, Josef and
Bojar, Ond{\v{r}}ej",
editor = "Vanroy, Bram and
Lefer, Marie-Aude and
Macken, Lieve and
Ruffo, Paola",
booktitle = "Proceedings of the 1st Workshop on Creative-text Translation and Technology",
month = jun,
year = "2024",
address = "Sheffield, United Kingdom",
publisher = "European Association for Machine Translation",
url = "https://aclanthology.org/2024.ctt-1.5",
pages = "40--56",
abstract = "This study examines neural machine translation (NMT) and its performance on texts that diverege from typical standards, focusing on how information is organized within sentences. We analyze surprisal distributions in source texts, human translations, and machine translations across several datasets to determine if NMT systems naturally promote a uniform density of surprisal in their translations, even when the original texts do not adhere to this principle.The findings reveal that NMT tends to align more closely with source texts in terms of surprisal uniformity compared to human translations.We analyzed absolute values of the surprisal uniformity measures as well, expecting that human translations will be less uniform. In contradiction to our initial hypothesis, we did not find comprehensive evidence for this claim, with some results suggesting this might be the case for very diverse texts, like poetry.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="jon-bojar-2024-analysis">
<titleInfo>
<title>An Analysis of Surprisal Uniformity in Machine and Human Translations</title>
</titleInfo>
<name type="personal">
<namePart type="given">Josef</namePart>
<namePart type="family">Jon</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ondřej</namePart>
<namePart type="family">Bojar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-06</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 1st Workshop on Creative-text Translation and Technology</title>
</titleInfo>
<name type="personal">
<namePart type="given">Bram</namePart>
<namePart type="family">Vanroy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Marie-Aude</namePart>
<namePart type="family">Lefer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lieve</namePart>
<namePart type="family">Macken</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Paola</namePart>
<namePart type="family">Ruffo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>European Association for Machine Translation</publisher>
<place>
<placeTerm type="text">Sheffield, United Kingdom</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This study examines neural machine translation (NMT) and its performance on texts that diverege from typical standards, focusing on how information is organized within sentences. We analyze surprisal distributions in source texts, human translations, and machine translations across several datasets to determine if NMT systems naturally promote a uniform density of surprisal in their translations, even when the original texts do not adhere to this principle.The findings reveal that NMT tends to align more closely with source texts in terms of surprisal uniformity compared to human translations.We analyzed absolute values of the surprisal uniformity measures as well, expecting that human translations will be less uniform. In contradiction to our initial hypothesis, we did not find comprehensive evidence for this claim, with some results suggesting this might be the case for very diverse texts, like poetry.</abstract>
<identifier type="citekey">jon-bojar-2024-analysis</identifier>
<location>
<url>https://aclanthology.org/2024.ctt-1.5</url>
</location>
<part>
<date>2024-06</date>
<extent unit="page">
<start>40</start>
<end>56</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T An Analysis of Surprisal Uniformity in Machine and Human Translations
%A Jon, Josef
%A Bojar, Ondřej
%Y Vanroy, Bram
%Y Lefer, Marie-Aude
%Y Macken, Lieve
%Y Ruffo, Paola
%S Proceedings of the 1st Workshop on Creative-text Translation and Technology
%D 2024
%8 June
%I European Association for Machine Translation
%C Sheffield, United Kingdom
%F jon-bojar-2024-analysis
%X This study examines neural machine translation (NMT) and its performance on texts that diverege from typical standards, focusing on how information is organized within sentences. We analyze surprisal distributions in source texts, human translations, and machine translations across several datasets to determine if NMT systems naturally promote a uniform density of surprisal in their translations, even when the original texts do not adhere to this principle.The findings reveal that NMT tends to align more closely with source texts in terms of surprisal uniformity compared to human translations.We analyzed absolute values of the surprisal uniformity measures as well, expecting that human translations will be less uniform. In contradiction to our initial hypothesis, we did not find comprehensive evidence for this claim, with some results suggesting this might be the case for very diverse texts, like poetry.
%U https://aclanthology.org/2024.ctt-1.5
%P 40-56
Markdown (Informal)
[An Analysis of Surprisal Uniformity in Machine and Human Translations](https://aclanthology.org/2024.ctt-1.5) (Jon & Bojar, CTT-WS 2024)
ACL