@inproceedings{dinu-etal-2024-verba,
title = "Verba volant, scripta volant? Don{'}t worry! There are computational solutions for protoword reconstruction",
author = "Dinu, Liviu and
Uban, Ana and
Cristea, Alina and
Iordache, Ioan-Bogdan and
Marchitan, Teodor-George and
Georgescu, Simona and
Zoicas, Laurentiu",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.362",
pages = "6314--6326",
abstract = "We introduce a new database of cognate words and etymons for the five main Romance languages, the most comprehensive one to date. We propose a strong benchmark for the automatic reconstruction of protowords for Romance languages, by applying a set of machine learning models and features on these data. The best results reach 90{\%} accuracy in predicting the protoword of a given cognate set, surpassing existing state-of-the-art results for this task and showing that computational methods can be very useful in assisting linguists with protoword reconstruction.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="dinu-etal-2024-verba">
<titleInfo>
<title>Verba volant, scripta volant? Don’t worry! There are computational solutions for protoword reconstruction</title>
</titleInfo>
<name type="personal">
<namePart type="given">Liviu</namePart>
<namePart type="family">Dinu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ana</namePart>
<namePart type="family">Uban</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Alina</namePart>
<namePart type="family">Cristea</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ioan-Bogdan</namePart>
<namePart type="family">Iordache</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Teodor-George</namePart>
<namePart type="family">Marchitan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Simona</namePart>
<namePart type="family">Georgescu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Laurentiu</namePart>
<namePart type="family">Zoicas</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-11</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yaser</namePart>
<namePart type="family">Al-Onaizan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mohit</namePart>
<namePart type="family">Bansal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yun-Nung</namePart>
<namePart type="family">Chen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Miami, Florida, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>We introduce a new database of cognate words and etymons for the five main Romance languages, the most comprehensive one to date. We propose a strong benchmark for the automatic reconstruction of protowords for Romance languages, by applying a set of machine learning models and features on these data. The best results reach 90% accuracy in predicting the protoword of a given cognate set, surpassing existing state-of-the-art results for this task and showing that computational methods can be very useful in assisting linguists with protoword reconstruction.</abstract>
<identifier type="citekey">dinu-etal-2024-verba</identifier>
<location>
<url>https://aclanthology.org/2024.emnlp-main.362</url>
</location>
<part>
<date>2024-11</date>
<extent unit="page">
<start>6314</start>
<end>6326</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Verba volant, scripta volant? Don’t worry! There are computational solutions for protoword reconstruction
%A Dinu, Liviu
%A Uban, Ana
%A Cristea, Alina
%A Iordache, Ioan-Bogdan
%A Marchitan, Teodor-George
%A Georgescu, Simona
%A Zoicas, Laurentiu
%Y Al-Onaizan, Yaser
%Y Bansal, Mohit
%Y Chen, Yun-Nung
%S Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing
%D 2024
%8 November
%I Association for Computational Linguistics
%C Miami, Florida, USA
%F dinu-etal-2024-verba
%X We introduce a new database of cognate words and etymons for the five main Romance languages, the most comprehensive one to date. We propose a strong benchmark for the automatic reconstruction of protowords for Romance languages, by applying a set of machine learning models and features on these data. The best results reach 90% accuracy in predicting the protoword of a given cognate set, surpassing existing state-of-the-art results for this task and showing that computational methods can be very useful in assisting linguists with protoword reconstruction.
%U https://aclanthology.org/2024.emnlp-main.362
%P 6314-6326
Markdown (Informal)
[Verba volant, scripta volant? Don’t worry! There are computational solutions for protoword reconstruction](https://aclanthology.org/2024.emnlp-main.362) (Dinu et al., EMNLP 2024)
ACL
- Liviu Dinu, Ana Uban, Alina Cristea, Ioan-Bogdan Iordache, Teodor-George Marchitan, Simona Georgescu, and Laurentiu Zoicas. 2024. Verba volant, scripta volant? Don’t worry! There are computational solutions for protoword reconstruction. In Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, pages 6314–6326, Miami, Florida, USA. Association for Computational Linguistics.