@inproceedings{dorn-2019-dialect,
title = "Dialect-Specific Models for Automatic Speech Recognition of {A}frican {A}merican {V}ernacular {E}nglish",
author = "Dorn, Rachel",
editor = "Kovatchev, Venelin and
Temnikova, Irina and
{\v{S}}andrih, Branislava and
Nikolova, Ivelina",
booktitle = "Proceedings of the Student Research Workshop Associated with RANLP 2019",
month = sep,
year = "2019",
address = "Varna, Bulgaria",
publisher = "INCOMA Ltd.",
url = "https://aclanthology.org/R19-2003/",
doi = "10.26615/issn.2603-2821.2019_003",
pages = "16--20",
abstract = "African American Vernacular English (AAVE) is a widely-spoken dialect of English, yet it is under-represented in major speech corpora. As a result, speakers of this dialect are often misunderstood by NLP applications. This study explores the effect on transcription accuracy of an automatic voice recognition system when AAVE data is used. Models trained on AAVE data and on Standard American English data were compared to a baseline model trained on a combination of the two dialects. The accuracy for both dialect-specific models was significantly higher than the baseline model, with the AAVE model showing over 18{\%} improvement. By isolating the effect of having AAVE speakers in the training data, this study highlights the importance of increasing diversity in the field of natural language processing."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="dorn-2019-dialect">
<titleInfo>
<title>Dialect-Specific Models for Automatic Speech Recognition of African American Vernacular English</title>
</titleInfo>
<name type="personal">
<namePart type="given">Rachel</namePart>
<namePart type="family">Dorn</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-09</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Student Research Workshop Associated with RANLP 2019</title>
</titleInfo>
<name type="personal">
<namePart type="given">Venelin</namePart>
<namePart type="family">Kovatchev</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Irina</namePart>
<namePart type="family">Temnikova</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Branislava</namePart>
<namePart type="family">Šandrih</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ivelina</namePart>
<namePart type="family">Nikolova</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>INCOMA Ltd.</publisher>
<place>
<placeTerm type="text">Varna, Bulgaria</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>African American Vernacular English (AAVE) is a widely-spoken dialect of English, yet it is under-represented in major speech corpora. As a result, speakers of this dialect are often misunderstood by NLP applications. This study explores the effect on transcription accuracy of an automatic voice recognition system when AAVE data is used. Models trained on AAVE data and on Standard American English data were compared to a baseline model trained on a combination of the two dialects. The accuracy for both dialect-specific models was significantly higher than the baseline model, with the AAVE model showing over 18% improvement. By isolating the effect of having AAVE speakers in the training data, this study highlights the importance of increasing diversity in the field of natural language processing.</abstract>
<identifier type="citekey">dorn-2019-dialect</identifier>
<identifier type="doi">10.26615/issn.2603-2821.2019_003</identifier>
<location>
<url>https://aclanthology.org/R19-2003/</url>
</location>
<part>
<date>2019-09</date>
<extent unit="page">
<start>16</start>
<end>20</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Dialect-Specific Models for Automatic Speech Recognition of African American Vernacular English
%A Dorn, Rachel
%Y Kovatchev, Venelin
%Y Temnikova, Irina
%Y Šandrih, Branislava
%Y Nikolova, Ivelina
%S Proceedings of the Student Research Workshop Associated with RANLP 2019
%D 2019
%8 September
%I INCOMA Ltd.
%C Varna, Bulgaria
%F dorn-2019-dialect
%X African American Vernacular English (AAVE) is a widely-spoken dialect of English, yet it is under-represented in major speech corpora. As a result, speakers of this dialect are often misunderstood by NLP applications. This study explores the effect on transcription accuracy of an automatic voice recognition system when AAVE data is used. Models trained on AAVE data and on Standard American English data were compared to a baseline model trained on a combination of the two dialects. The accuracy for both dialect-specific models was significantly higher than the baseline model, with the AAVE model showing over 18% improvement. By isolating the effect of having AAVE speakers in the training data, this study highlights the importance of increasing diversity in the field of natural language processing.
%R 10.26615/issn.2603-2821.2019_003
%U https://aclanthology.org/R19-2003/
%U https://doi.org/10.26615/issn.2603-2821.2019_003
%P 16-20
Markdown (Informal)
[Dialect-Specific Models for Automatic Speech Recognition of African American Vernacular English](https://aclanthology.org/R19-2003/) (Dorn, RANLP 2019)
ACL