% Conference paper (NoDaLiDa 2021) presenting a large Icelandic TTS corpus.
% Non-ASCII letters are written as LaTeX escapes; the \TH and \dh macros need a
% font encoding that defines them (e.g. T1 via the fontenc package).
% Case-sensitive words in the title are protected as whole words so that
% sentence-casing styles do not lowercase them.
% The month field concatenates the predefined may/jun macros with the day range.
@inproceedings{sigurgeirsson-etal-2021-talromur,
  title     = {{Talr{\'o}mur}: A large {Icelandic} {TTS} corpus},
  author    = {Sigurgeirsson, Atli and
               Gunnarsson, {\TH}orsteinn and
               {\"O}rn{\'o}lfsson, Gunnar and
               Magn{\'u}sd{\'o}ttir, Eyd{\'i}s and
               {\TH}{\'o}rhallsd{\'o}ttir, Ragnhei{\dh}ur and
               J{\'o}nsson, Stef{\'a}n and
               Gu{\dh}nason, J{\'o}n},
  editor    = {Dobnik, Simon and
               {\O}vrelid, Lilja},
  booktitle = {Proceedings of the 23rd Nordic Conference on Computational Linguistics ({NoDaLiDa})},
  month     = may # " 31--2 " # jun,
  year      = {2021},
  address   = {Reykjavik, Iceland (Online)},
  publisher = {Link{\"o}ping University Electronic Press, Sweden},
  url       = {https://aclanthology.org/2021.nodalida-main.50/},
  pages     = {440--444},
  abstract  = {We present Talr{\'o}mur, a large high-quality Text-To-Speech (TTS) corpus for the Icelandic language. This multi-speaker corpus contains recordings from 4 male speakers and 4 female speakers of a wide range in age and speaking style. The corpus consists of 122,417 single utterance recordings equating to approximately 213 hours of voice data. All speakers read from the same script which has a high coverage of possible Icelandic diphones. Manual analysis of 15,956 utterances indicates that the corpus has a reading mistake rate no higher than 0.25{\%}. We additionally present results from subjective evaluations of the different voices with regards to intelligibility, likeability and trustworthiness.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 bibliographic record for citekey sigurgeirsson-etal-2021-talromur. -->
<!-- Personal names are stored as plain Unicode text (no LaTeX macros). -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="sigurgeirsson-etal-2021-talromur">
    <titleInfo>
      <title>Talrómur: A large Icelandic TTS corpus</title>
    </titleInfo>
    <!-- Authors, in publication order. -->
    <name type="personal">
      <namePart type="given">Atli</namePart>
      <namePart type="family">Sigurgeirsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Þorsteinn</namePart>
      <namePart type="family">Gunnarsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Gunnar</namePart>
      <namePart type="family">Örnólfsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Eydís</namePart>
      <namePart type="family">Magnúsdóttir</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Ragnheiður</namePart>
      <namePart type="family">Þórhallsdóttir</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Stefán</namePart>
      <namePart type="family">Jónsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jón</namePart>
      <namePart type="family">Guðnason</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <!-- NOTE(review): free-text date with no encoding attribute; presumably 31 May to 2 June 2021. Confirm before normalizing to ISO 8601. -->
      <dateIssued>2021-may 31–2 jun</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume, with its editors and publisher. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 23rd Nordic Conference on Computational Linguistics (NoDaLiDa)</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Simon</namePart>
        <namePart type="family">Dobnik</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Lilja</namePart>
        <namePart type="family">Øvrelid</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Linköping University Electronic Press, Sweden</publisher>
        <place>
          <placeTerm type="text">Reykjavik, Iceland (Online)</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>We present Talrómur, a large high-quality Text-To-Speech (TTS) corpus for the Icelandic language. This multi-speaker corpus contains recordings from 4 male speakers and 4 female speakers of a wide range in age and speaking style. The corpus consists of 122,417 single utterance recordings equating to approximately 213 hours of voice data. All speakers read from the same script which has a high coverage of possible Icelandic diphones. Manual analysis of 15,956 utterances indicates that the corpus has a reading mistake rate no higher than 0.25%. We additionally present results from subjective evaluations of the different voices with regards to intelligibility, likeability and trustworthiness.</abstract>
    <identifier type="citekey">sigurgeirsson-etal-2021-talromur</identifier>
    <location>
      <url>https://aclanthology.org/2021.nodalida-main.50/</url>
    </location>
    <part>
      <date>2021-may 31–2 jun</date>
      <extent unit="page">
        <start>440</start>
        <end>444</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Talrómur: A large Icelandic TTS corpus
%A Sigurgeirsson, Atli
%A Gunnarsson, Þorsteinn
%A Örnólfsson, Gunnar
%A Magnúsdóttir, Eydís
%A Þórhallsdóttir, Ragnheiður
%A Jónsson, Stefán
%A Guðnason, Jón
%Y Dobnik, Simon
%Y Øvrelid, Lilja
%S Proceedings of the 23rd Nordic Conference on Computational Linguistics (NoDaLiDa)
%D 2021
%8 may 31–2 jun
%I Linköping University Electronic Press, Sweden
%C Reykjavik, Iceland (Online)
%F sigurgeirsson-etal-2021-talromur
%X We present Talrómur, a large high-quality Text-To-Speech (TTS) corpus for the Icelandic language. This multi-speaker corpus contains recordings from 4 male speakers and 4 female speakers of a wide range in age and speaking style. The corpus consists of 122,417 single utterance recordings equating to approximately 213 hours of voice data. All speakers read from the same script which has a high coverage of possible Icelandic diphones. Manual analysis of 15,956 utterances indicates that the corpus has a reading mistake rate no higher than 0.25%. We additionally present results from subjective evaluations of the different voices with regards to intelligibility, likeability and trustworthiness.
%U https://aclanthology.org/2021.nodalida-main.50/
%P 440-444
Markdown (Informal)
[Talrómur: A large Icelandic TTS corpus](https://aclanthology.org/2021.nodalida-main.50/) (Sigurgeirsson et al., NoDaLiDa 2021)
ACL
- Atli Sigurgeirsson, Þorsteinn Gunnarsson, Gunnar Örnólfsson, Eydís Magnúsdóttir, Ragnheiður Þórhallsdóttir, Stefán Jónsson, and Jón Guðnason. 2021. Talrómur: A large Icelandic TTS corpus. In Proceedings of the 23rd Nordic Conference on Computational Linguistics (NoDaLiDa), pages 440–444, Reykjavik, Iceland (Online). Linköping University Electronic Press, Sweden.