@inproceedings{le-ferrand-prudhommeaux-2024-automatic,
title = "Automatic Transcription of Grammaticality Judgements for Language Documentation",
author = "Le Ferrand, {\'E}ric and
Prud{'}hommeaux, Emily",
editor = "Moeller, Sarah and
Agyapong, Godfred and
Arppe, Antti and
Chaudhary, Aditi and
Rijhwani, Shruti and
Cox, Christopher and
Henke, Ryan and
Palmer, Alexis and
Rosenblum, Daisy and
Schwartz, Lane",
booktitle = "Proceedings of the Seventh Workshop on the Use of Computational Methods in the Study of Endangered Languages",
month = mar,
year = "2024",
address = "St. Julians, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.computel-1.6",
pages = "33--38",
abstract = "Descriptive linguistics is a sub-field of linguistics that involves the collection and annotation of language resources to describe linguistic phenomena. The transcription of these resources is often described as a tedious task, and Automatic Speech Recognition (ASR) has frequently been employed to support this process. However, the typical research approach to ASR in documentary linguistics often only captures a subset of the field{'}s diverse reality. In this paper, we focus specifically on one type of data known as grammaticality judgment elicitation in the context of documenting Kr{\'e}y{\`o}l Gwadloup{\'e}yen. We show that only a few minutes of speech is enough to fine-tune a model originally trained in French to transcribe segments in Kr{\'e}yol.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="le-ferrand-prudhommeaux-2024-automatic">
<titleInfo>
<title>Automatic Transcription of Grammaticality Judgements for Language Documentation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Éric</namePart>
<namePart type="family">Le Ferrand</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Emily</namePart>
<namePart type="family">Prud’hommeaux</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-03</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Seventh Workshop on the Use of Computational Methods in the Study of Endangered Languages</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sarah</namePart>
<namePart type="family">Moeller</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Godfred</namePart>
<namePart type="family">Agyapong</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Antti</namePart>
<namePart type="family">Arppe</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Aditi</namePart>
<namePart type="family">Chaudhary</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Shruti</namePart>
<namePart type="family">Rijhwani</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Christopher</namePart>
<namePart type="family">Cox</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ryan</namePart>
<namePart type="family">Henke</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Alexis</namePart>
<namePart type="family">Palmer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Daisy</namePart>
<namePart type="family">Rosenblum</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lane</namePart>
<namePart type="family">Schwartz</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">St. Julians, Malta</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Descriptive linguistics is a sub-field of linguistics that involves the collection and annotation of language resources to describe linguistic phenomena. The transcription of these resources is often described as a tedious task, and Automatic Speech Recognition (ASR) has frequently been employed to support this process. However, the typical research approach to ASR in documentary linguistics often only captures a subset of the field’s diverse reality. In this paper, we focus specifically on one type of data known as grammaticality judgment elicitation in the context of documenting Kréyòl Gwadloupéyen. We show that only a few minutes of speech is enough to fine-tune a model originally trained in French to transcribe segments in Kréyol.</abstract>
<identifier type="citekey">le-ferrand-prudhommeaux-2024-automatic</identifier>
<location>
<url>https://aclanthology.org/2024.computel-1.6</url>
</location>
<part>
<date>2024-03</date>
<extent unit="page">
<start>33</start>
<end>38</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Automatic Transcription of Grammaticality Judgements for Language Documentation
%A Le Ferrand, Éric
%A Prud’hommeaux, Emily
%Y Moeller, Sarah
%Y Agyapong, Godfred
%Y Arppe, Antti
%Y Chaudhary, Aditi
%Y Rijhwani, Shruti
%Y Cox, Christopher
%Y Henke, Ryan
%Y Palmer, Alexis
%Y Rosenblum, Daisy
%Y Schwartz, Lane
%S Proceedings of the Seventh Workshop on the Use of Computational Methods in the Study of Endangered Languages
%D 2024
%8 March
%I Association for Computational Linguistics
%C St. Julians, Malta
%F le-ferrand-prudhommeaux-2024-automatic
%X Descriptive linguistics is a sub-field of linguistics that involves the collection and annotation of language resources to describe linguistic phenomena. The transcription of these resources is often described as a tedious task, and Automatic Speech Recognition (ASR) has frequently been employed to support this process. However, the typical research approach to ASR in documentary linguistics often only captures a subset of the field’s diverse reality. In this paper, we focus specifically on one type of data known as grammaticality judgment elicitation in the context of documenting Kréyòl Gwadloupéyen. We show that only a few minutes of speech is enough to fine-tune a model originally trained in French to transcribe segments in Kréyol.
%U https://aclanthology.org/2024.computel-1.6
%P 33-38
Markdown (Informal)
[Automatic Transcription of Grammaticality Judgements for Language Documentation](https://aclanthology.org/2024.computel-1.6) (Le Ferrand & Prud’hommeaux, ComputEL-WS 2024)
ACL