% GailBot journal article (Dialogue & Discourse 13, 2022). Compound surnames are
% written in "Particle Last, First" form so the particle stays in the family name.
@article{umair-etal-2022-gailbot,
    title     = {{GailBot}: An automatic transcription system for {Conversation} {Analysis}},
    author    = {Umair, Muhammad and
                 Mertens, Julia Beret and
                 Albert, Saul and
                 De Ruiter, Jan Peter},
    editor    = {Stent, Amanda and
                 Di Eugenio, Barbara and
                 Poesio, Massimo and
                 Georgila, Kallirroi and
                 Stede, Manfred},
    journal   = {Dialogue {\&} Discourse},
    volume    = {13},
    month     = apr,
    year      = {2022},
    address   = {Chicago, Illinois, USA},
    publisher = {University of Illinois Chicago},
    url       = {https://aclanthology.org/2022.dnd-13.5/},
    doi       = {10.5210/dad.2022.103},
    pages     = {63--95},
    abstract  = {Researchers studying human interaction, such as conversation analysts, psychologists, and linguists, all rely on detailed transcriptions of language use. Ideally, these should include so-called paralinguistic features of talk, such as overlaps, prosody, and intonation, as they convey important information. However, creating conversational transcripts that include these features by hand requires substantial amounts of time by trained transcribers. There are currently no Speech to Text (STT) systems that are able to integrate these features in the generated transcript. To reduce the resources needed to create detailed conversation transcripts that include representation of paralinguistic features, we developed a program called GailBot. GailBot combines STT services with plugins to automatically generate first drafts of transcripts that largely follow the transcription standards common in the field of Conversation Analysis. It also enables researchers to add new plugins to transcribe additional features, or to improve the plugins it currently uses. We describe GailBot{'}s architecture and its use of computational heuristics and machine learning. We also evaluate its output in relation to transcripts produced by both human transcribers and comparable automated transcription systems. We argue that despite its limitations, GailBot represents a substantial improvement over existing dialogue transcription software.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS record for the GailBot journal article; the host relatedItem describes the journal. -->
  <mods ID="umair-etal-2022-gailbot">
    <titleInfo>
      <title>GailBot: An automatic transcription system for Conversation Analysis</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Muhammad</namePart>
      <namePart type="family">Umair</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Julia</namePart>
      <namePart type="given">Beret</namePart>
      <namePart type="family">Mertens</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Saul</namePart>
      <namePart type="family">Albert</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jan</namePart>
      <namePart type="given">Peter</namePart>
      <!-- The particle "De" belongs to the family name, not the given names. -->
      <namePart type="family">De Ruiter</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2022-04</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <genre authority="bibutilsgt">journal article</genre>
    <relatedItem type="host">
      <titleInfo>
        <!-- A literal ampersand must be written as &amp; for the document to be well-formed. -->
        <title>Dialogue &amp; Discourse</title>
      </titleInfo>
      <originInfo>
        <issuance>continuing</issuance>
        <publisher>University of Illinois Chicago</publisher>
        <place>
          <placeTerm type="text">Chicago, Illinois, USA</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">periodical</genre>
      <genre authority="bibutilsgt">academic journal</genre>
    </relatedItem>
    <abstract>Researchers studying human interaction, such as conversation analysts, psychologists, and linguists, all rely on detailed transcriptions of language use. Ideally, these should include so-called paralinguistic features of talk, such as overlaps, prosody, and intonation, as they convey important information. However, creating conversational transcripts that include these features by hand requires substantial amounts of time by trained transcribers. There are currently no Speech to Text (STT) systems that are able to integrate these features in the generated transcript. To reduce the resources needed to create detailed conversation transcripts that include representation of paralinguistic features, we developed a program called GailBot. GailBot combines STT services with plugins to automatically generate first drafts of transcripts that largely follow the transcription standards common in the field of Conversation Analysis. It also enables researchers to add new plugins to transcribe additional features, or to improve the plugins it currently uses. We describe GailBot’s architecture and its use of computational heuristics and machine learning. We also evaluate its output in relation to transcripts produced by both human transcribers and comparable automated transcription systems. We argue that despite its limitations, GailBot represents a substantial improvement over existing dialogue transcription software.</abstract>
    <identifier type="citekey">umair-etal-2022-gailbot</identifier>
    <identifier type="doi">10.5210/dad.2022.103</identifier>
    <location>
      <url>https://aclanthology.org/2022.dnd-13.5/</url>
    </location>
    <part>
      <date>2022-04</date>
      <detail type="volume"><number>13</number></detail>
      <extent unit="page">
        <start>63</start>
        <end>95</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Journal Article
%T GailBot: An automatic transcription system for Conversation Analysis
%A Umair, Muhammad
%A Mertens, Julia Beret
%A Albert, Saul
%A De Ruiter, Jan Peter
%J Dialogue & Discourse
%D 2022
%8 April
%V 13
%I University of Illinois Chicago
%C Chicago, Illinois, USA
%F umair-etal-2022-gailbot
%X Researchers studying human interaction, such as conversation analysts, psychologists, and linguists, all rely on detailed transcriptions of language use. Ideally, these should include so-called paralinguistic features of talk, such as overlaps, prosody, and intonation, as they convey important information. However, creating conversational transcripts that include these features by hand requires substantial amounts of time by trained transcribers. There are currently no Speech to Text (STT) systems that are able to integrate these features in the generated transcript. To reduce the resources needed to create detailed conversation transcripts that include representation of paralinguistic features, we developed a program called GailBot. GailBot combines STT services with plugins to automatically generate first drafts of transcripts that largely follow the transcription standards common in the field of Conversation Analysis. It also enables researchers to add new plugins to transcribe additional features, or to improve the plugins it currently uses. We describe GailBot’s architecture and its use of computational heuristics and machine learning. We also evaluate its output in relation to transcripts produced by both human transcribers and comparable automated transcription systems. We argue that despite its limitations, GailBot represents a substantial improvement over existing dialogue transcription software.
%R 10.5210/dad.2022.103
%U https://aclanthology.org/2022.dnd-13.5/
%U https://doi.org/10.5210/dad.2022.103
%P 63-95
Markdown (Informal)
[GailBot: An automatic transcription system for Conversation Analysis](https://aclanthology.org/2022.dnd-13.5/) (Umair et al., DND 2022)
ACL