% Workshop paper (AT4SSL 2023), ACL Anthology ID 2023.at4ssl-1.5.
% Editor names are written in the "von Last, First" form so that surname
% particles (De Sisto, Van Landuyt) are parsed as part of the family name
% rather than as a trailing given name.
% Title words that must keep their capitalisation are braced as whole words.
@inproceedings{mcgill-saggion-2023-bsl,
  title     = {{BSL}-{Hansard}: A parallel, multimodal corpus of {English} and interpreted {British} {Sign} {Language} data from parliamentary proceedings},
  author    = {McGill, Euan and
               Saggion, Horacio},
  editor    = {Shterionov, Dimitar and
               De Sisto, Mirella and
               M{\"u}ller, Mathias and
               Van Landuyt, Davy and
               Omardeen, Rehana and
               O'Boyle, Shaun and
               Braffort, Annelies and
               Roelofsen, Floris and
               Blain, Fred and
               Vanroy, Bram and
               Avramidis, Eleftherios},
  booktitle = {Proceedings of the Second International Workshop on Automatic Translation for Signed and Spoken Languages},
  month     = jun,
  year      = {2023},
  address   = {Tampere, Finland},
  publisher = {European Association for Machine Translation},
  url       = {https://aclanthology.org/2023.at4ssl-1.5},
  pages     = {38--43},
  abstract  = {BSL-Hansard is a novel open source and multimodal resource composed by combining Sign Language video data in BSL and English text from the official transcription of British parliamentary sessions. This paper describes the method followed to compile BSL-Hansard including time alignment of text using the MAUS (Schiel, 2015) segmentation system, gives some statistics about this dataset, and suggests experiments. These primarily include end-to-end Sign Language-to-text translation, but is also relevant for broader machine translation, and speech and language processing tasks.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS record for the paper with cite key mcgill-saggion-2023-bsl.
       The top-level name elements are the paper's authors; the host
       relatedItem describes the proceedings volume and lists its editors. -->
  <mods ID="mcgill-saggion-2023-bsl">
    <titleInfo>
      <title>BSL-Hansard: A parallel, multimodal corpus of English and interpreted British Sign Language data from parliamentary proceedings</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Euan</namePart>
      <namePart type="family">McGill</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Horacio</namePart>
      <namePart type="family">Saggion</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2023-06</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the Second International Workshop on Automatic Translation for Signed and Spoken Languages</title>
      </titleInfo>
      <!-- Editors. Surname particles ("De", "Van") are kept inside the
           family namePart so that sorting and citation use the full surname. -->
      <name type="personal">
        <namePart type="given">Dimitar</namePart>
        <namePart type="family">Shterionov</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Mirella</namePart>
        <namePart type="family">De Sisto</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Mathias</namePart>
        <namePart type="family">Müller</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Davy</namePart>
        <namePart type="family">Van Landuyt</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Rehana</namePart>
        <namePart type="family">Omardeen</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Shaun</namePart>
        <namePart type="family">O'Boyle</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Annelies</namePart>
        <namePart type="family">Braffort</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Floris</namePart>
        <namePart type="family">Roelofsen</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Fred</namePart>
        <namePart type="family">Blain</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Bram</namePart>
        <namePart type="family">Vanroy</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Eleftherios</namePart>
        <namePart type="family">Avramidis</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>European Association for Machine Translation</publisher>
        <place>
          <placeTerm type="text">Tampere, Finland</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>BSL-Hansard is a novel open source and multimodal resource composed by combining Sign Language video data in BSL and English text from the official transcription of British parliamentary sessions. This paper describes the method followed to compile BSL-Hansard including time alignment of text using the MAUS (Schiel, 2015) segmentation system, gives some statistics about this dataset, and suggests experiments. These primarily include end-to-end Sign Language-to-text translation, but is also relevant for broader machine translation, and speech and language processing tasks.</abstract>
    <identifier type="citekey">mcgill-saggion-2023-bsl</identifier>
    <location>
      <url>https://aclanthology.org/2023.at4ssl-1.5</url>
    </location>
    <!-- Page range of the paper within the host proceedings. -->
    <part>
      <date>2023-06</date>
      <extent unit="page">
        <start>38</start>
        <end>43</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T BSL-Hansard: A parallel, multimodal corpus of English and interpreted British Sign Language data from parliamentary proceedings
%A McGill, Euan
%A Saggion, Horacio
%Y Shterionov, Dimitar
%Y De Sisto, Mirella
%Y Müller, Mathias
%Y Van Landuyt, Davy
%Y Omardeen, Rehana
%Y O'Boyle, Shaun
%Y Braffort, Annelies
%Y Roelofsen, Floris
%Y Blain, Fred
%Y Vanroy, Bram
%Y Avramidis, Eleftherios
%S Proceedings of the Second International Workshop on Automatic Translation for Signed and Spoken Languages
%D 2023
%8 June
%I European Association for Machine Translation
%C Tampere, Finland
%F mcgill-saggion-2023-bsl
%X BSL-Hansard is a novel open source and multimodal resource composed by combining Sign Language video data in BSL and English text from the official transcription of British parliamentary sessions. This paper describes the method followed to compile BSL-Hansard including time alignment of text using the MAUS (Schiel, 2015) segmentation system, gives some statistics about this dataset, and suggests experiments. These primarily include end-to-end Sign Language-to-text translation, but is also relevant for broader machine translation, and speech and language processing tasks.
%U https://aclanthology.org/2023.at4ssl-1.5
%P 38-43
Markdown (Informal)
[BSL-Hansard: A parallel, multimodal corpus of English and interpreted British Sign Language data from parliamentary proceedings](https://aclanthology.org/2023.at4ssl-1.5) (McGill & Saggion, AT4SSL 2023)
ACL