@inproceedings{dabre-sukhoo-2022-kreolmorisienmt,
title = "{K}reol{M}orisien{MT}: A Dataset for Mauritian Creole Machine Translation",
author = "Dabre, Raj and
Sukhoo, Aneerav",
editor = "He, Yulan and
Ji, Heng and
Li, Sujian and
Liu, Yang and
Chang, Chua-Hui",
booktitle = "Findings of the Association for Computational Linguistics: AACL-IJCNLP 2022",
month = nov,
year = "2022",
address = "Online only",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.findings-aacl.3/",
doi = "10.18653/v1/2022.findings-aacl.3",
pages = "22--29",
abstract = "In this paper, we describe KreolMorisienMT, a dataset for benchmarking machine translation quality of Mauritian Creole. Mauritian Creole (Kreol Morisien) is a French-based creole and a lingua franca of the Republic of Mauritius. KreolMorisienMT consists of a parallel corpus between English and Kreol Morisien, French and Kreol Morisien and a monolingual corpus for Kreol Morisien. We first give an overview of Kreol Morisien and then describe the steps taken to create the corpora. Thereafter, we benchmark Kreol Morisien {\ensuremath{\leftrightarrow}} English and Kreol Morisien {\ensuremath{\leftrightarrow}} French models leveraging pre-trained models and multilingual transfer learning. Human evaluation reveals our systems' high translation quality."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="dabre-sukhoo-2022-kreolmorisienmt">
<titleInfo>
<title>KreolMorisienMT: A Dataset for Mauritian Creole Machine Translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Raj</namePart>
<namePart type="family">Dabre</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Aneerav</namePart>
<namePart type="family">Sukhoo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2022-11</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Findings of the Association for Computational Linguistics: AACL-IJCNLP 2022</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yulan</namePart>
<namePart type="family">He</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Heng</namePart>
<namePart type="family">Ji</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sujian</namePart>
<namePart type="family">Li</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yang</namePart>
<namePart type="family">Liu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chua-Hui</namePart>
<namePart type="family">Chang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online only</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we describe KreolMorisienMT, a dataset for benchmarking machine translation quality of Mauritian Creole. Mauritian Creole (Kreol Morisien) is a French-based creole and a lingua franca of the Republic of Mauritius. KreolMorisienMT consists of a parallel corpus between English and Kreol Morisien, French and Kreol Morisien and a monolingual corpus for Kreol Morisien. We first give an overview of Kreol Morisien and then describe the steps taken to create the corpora. Thereafter, we benchmark Kreol Morisien ↔ English and Kreol Morisien ↔ French models leveraging pre-trained models and multilingual transfer learning. Human evaluation reveals our systems’ high translation quality.</abstract>
<identifier type="citekey">dabre-sukhoo-2022-kreolmorisienmt</identifier>
<identifier type="doi">10.18653/v1/2022.findings-aacl.3</identifier>
<location>
<url>https://aclanthology.org/2022.findings-aacl.3/</url>
</location>
<part>
<date>2022-11</date>
<extent unit="page">
<start>22</start>
<end>29</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T KreolMorisienMT: A Dataset for Mauritian Creole Machine Translation
%A Dabre, Raj
%A Sukhoo, Aneerav
%Y He, Yulan
%Y Ji, Heng
%Y Li, Sujian
%Y Liu, Yang
%Y Chang, Chua-Hui
%S Findings of the Association for Computational Linguistics: AACL-IJCNLP 2022
%D 2022
%8 November
%I Association for Computational Linguistics
%C Online only
%F dabre-sukhoo-2022-kreolmorisienmt
%X In this paper, we describe KreolMorisienMT, a dataset for benchmarking machine translation quality of Mauritian Creole. Mauritian Creole (Kreol Morisien) is a French-based creole and a lingua franca of the Republic of Mauritius. KreolMorisienMT consists of a parallel corpus between English and Kreol Morisien, French and Kreol Morisien and a monolingual corpus for Kreol Morisien. We first give an overview of Kreol Morisien and then describe the steps taken to create the corpora. Thereafter, we benchmark Kreol Morisien ↔ English and Kreol Morisien ↔ French models leveraging pre-trained models and multilingual transfer learning. Human evaluation reveals our systems’ high translation quality.
%R 10.18653/v1/2022.findings-aacl.3
%U https://aclanthology.org/2022.findings-aacl.3/
%U https://doi.org/10.18653/v1/2022.findings-aacl.3
%P 22-29
Markdown (Informal)
[KreolMorisienMT: A Dataset for Mauritian Creole Machine Translation](https://aclanthology.org/2022.findings-aacl.3/) (Dabre & Sukhoo, Findings 2022)
ACL