@inproceedings{van-der-goot-2019-monoise,
title = "{M}o{N}oise: A Multi-lingual and Easy-to-use Lexical Normalization Tool",
author = "van der Goot, Rob",
editor = "Costa-juss{\`a}, Marta R. and
Alfonseca, Enrique",
booktitle = "Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics: System Demonstrations",
month = jul,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/P19-3032",
doi = "10.18653/v1/P19-3032",
pages = "201--206",
abstract = "In this paper, we introduce and demonstrate the online demo as well as the command line interface of a lexical normalization system (MoNoise) for a variety of languages. We further improve this model by using features from the original word for every normalization candidate. For comparison with future work, we propose the bundling of seven datasets in six languages to form a new benchmark, together with a novel evaluation metric which is particularly suitable for cross-dataset comparisons. MoNoise reaches a new state-of-art performance for six out of seven of these datasets. Furthermore, we allow the user to tune the {`}aggressiveness{'} of the normalization, and show how the model can be made more efficient with only a small loss in performance. The online demo can be found on: \url{http://www.robvandergoot.com/monoise} and the corresponding code on: \url{https://bitbucket.org/robvanderg/monoise/}",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="van-der-goot-2019-monoise">
<titleInfo>
<title>MoNoise: A Multi-lingual and Easy-to-use Lexical Normalization Tool</title>
</titleInfo>
<name type="personal">
<namePart type="given">Rob</namePart>
<namePart type="family">van der Goot</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics: System Demonstrations</title>
</titleInfo>
<name type="personal">
<namePart type="given">Marta</namePart>
<namePart type="given">R</namePart>
<namePart type="family">Costa-jussà</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Enrique</namePart>
<namePart type="family">Alfonseca</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Florence, Italy</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we introduce and demonstrate the online demo as well as the command line interface of a lexical normalization system (MoNoise) for a variety of languages. We further improve this model by using features from the original word for every normalization candidate. For comparison with future work, we propose the bundling of seven datasets in six languages to form a new benchmark, together with a novel evaluation metric which is particularly suitable for cross-dataset comparisons. MoNoise reaches a new state-of-art performance for six out of seven of these datasets. Furthermore, we allow the user to tune the ‘aggressiveness’ of the normalization, and show how the model can be made more efficient with only a small loss in performance. The online demo can be found on: http://www.robvandergoot.com/monoise and the corresponding code on: https://bitbucket.org/robvanderg/monoise/</abstract>
<identifier type="citekey">van-der-goot-2019-monoise</identifier>
<identifier type="doi">10.18653/v1/P19-3032</identifier>
<location>
<url>https://aclanthology.org/P19-3032</url>
</location>
<part>
<date>2019-07</date>
<extent unit="page">
<start>201</start>
<end>206</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T MoNoise: A Multi-lingual and Easy-to-use Lexical Normalization Tool
%A van der Goot, Rob
%Y Costa-jussà, Marta R.
%Y Alfonseca, Enrique
%S Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics: System Demonstrations
%D 2019
%8 July
%I Association for Computational Linguistics
%C Florence, Italy
%F van-der-goot-2019-monoise
%X In this paper, we introduce and demonstrate the online demo as well as the command line interface of a lexical normalization system (MoNoise) for a variety of languages. We further improve this model by using features from the original word for every normalization candidate. For comparison with future work, we propose the bundling of seven datasets in six languages to form a new benchmark, together with a novel evaluation metric which is particularly suitable for cross-dataset comparisons. MoNoise reaches a new state-of-art performance for six out of seven of these datasets. Furthermore, we allow the user to tune the ‘aggressiveness’ of the normalization, and show how the model can be made more efficient with only a small loss in performance. The online demo can be found on: http://www.robvandergoot.com/monoise and the corresponding code on: https://bitbucket.org/robvanderg/monoise/
%R 10.18653/v1/P19-3032
%U https://aclanthology.org/P19-3032
%U https://doi.org/10.18653/v1/P19-3032
%P 201-206
Markdown (Informal)
[MoNoise: A Multi-lingual and Easy-to-use Lexical Normalization Tool](https://aclanthology.org/P19-3032) (van der Goot, ACL 2019)
ACL