@inproceedings{oliver-alvarez-vidal-2024-litpc,
title = "{L}it{PC}: A set of tools for building parallel corpora from literary works",
author = "Oliver, Antoni and
Alvarez-Vidal, Sergi",
editor = "Vanroy, Bram and
Lefer, Marie-Aude and
Macken, Lieve and
Ruffo, Paola",
booktitle = "Proceedings of the 1st Workshop on Creative-text Translation and Technology",
month = jun,
year = "2024",
address = "Sheffield, United Kingdom",
publisher = "European Association for Machine Translation",
url = "https://aclanthology.org/2024.ctt-1.3",
pages = "21--31",
abstract = "In this paper, we describe the LitPC toolkit, a variety of tools and methods designed for the quick and effective creation of parallel corpora derived from literary works. This toolkit can be a useful resource due to the scarcity of curated parallel texts for this domain. We also feature a case study describing the creation of a Russian-English parallel corpus based on the literary works by Leo Tolstoy. Furthermore, an augmented version of this corpus is used to both train and assess neural machine translation systems specifically adapted to the author{'}s style.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="oliver-alvarez-vidal-2024-litpc">
<titleInfo>
<title>LitPC: A set of tools for building parallel corpora from literary works</title>
</titleInfo>
<name type="personal">
<namePart type="given">Antoni</namePart>
<namePart type="family">Oliver</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sergi</namePart>
<namePart type="family">Alvarez-Vidal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-06</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 1st Workshop on Creative-text Translation and Technology</title>
</titleInfo>
<name type="personal">
<namePart type="given">Bram</namePart>
<namePart type="family">Vanroy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Marie-Aude</namePart>
<namePart type="family">Lefer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lieve</namePart>
<namePart type="family">Macken</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Paola</namePart>
<namePart type="family">Ruffo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>European Association for Machine Translation</publisher>
<place>
<placeTerm type="text">Sheffield, United Kingdom</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we describe the LitPC toolkit, a variety of tools and methods designed for the quick and effective creation of parallel corpora derived from literary works. This toolkit can be a useful resource due to the scarcity of curated parallel texts for this domain. We also feature a case study describing the creation of a Russian-English parallel corpus based on the literary works by Leo Tolstoy. Furthermore, an augmented version of this corpus is used to both train and assess neural machine translation systems specifically adapted to the author’s style.</abstract>
<identifier type="citekey">oliver-alvarez-vidal-2024-litpc</identifier>
<location>
<url>https://aclanthology.org/2024.ctt-1.3</url>
</location>
<part>
<date>2024-06</date>
<extent unit="page">
<start>21</start>
<end>31</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T LitPC: A set of tools for building parallel corpora from literary works
%A Oliver, Antoni
%A Alvarez-Vidal, Sergi
%Y Vanroy, Bram
%Y Lefer, Marie-Aude
%Y Macken, Lieve
%Y Ruffo, Paola
%S Proceedings of the 1st Workshop on Creative-text Translation and Technology
%D 2024
%8 June
%I European Association for Machine Translation
%C Sheffield, United Kingdom
%F oliver-alvarez-vidal-2024-litpc
%X In this paper, we describe the LitPC toolkit, a variety of tools and methods designed for the quick and effective creation of parallel corpora derived from literary works. This toolkit can be a useful resource due to the scarcity of curated parallel texts for this domain. We also feature a case study describing the creation of a Russian-English parallel corpus based on the literary works by Leo Tolstoy. Furthermore, an augmented version of this corpus is used to both train and assess neural machine translation systems specifically adapted to the author’s style.
%U https://aclanthology.org/2024.ctt-1.3
%P 21-31
Markdown (Informal)
[LitPC: A set of tools for building parallel corpora from literary works](https://aclanthology.org/2024.ctt-1.3) (Oliver & Alvarez-Vidal, CTT-WS 2024)
ACL