@inproceedings{albogamy-ramsay-2016-unsupervised,
title = "Unsupervised Stemmer for {A}rabic Tweets",
author = "Albogamy, Fahad and
Ramsay, Allan",
editor = "Han, Bo and
Ritter, Alan and
Derczynski, Leon and
Xu, Wei and
Baldwin, Tim",
booktitle = "Proceedings of the 2nd Workshop on Noisy User-generated Text ({WNUT})",
month = dec,
year = "2016",
address = "Osaka, Japan",
publisher = "The COLING 2016 Organizing Committee",
url = "https://aclanthology.org/W16-3912",
pages = "78--84",
abstract = "Stemming is an essential processing step in a wide range of high level text processing applications such as information extraction, machine translation and sentiment analysis. It is used to reduce words to their stems. Many stemming algorithms have been developed for Modern Standard Arabic (MSA). Although Arabic tweets and MSA are closely related and share many characteristics, there are substantial differences between them in lexicon and syntax. In this paper, we introduce a light Arabic stemmer for Arabic tweets. Our results show improvements over the performance of a number of well-known stemmers for Arabic.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="albogamy-ramsay-2016-unsupervised">
<titleInfo>
<title>Unsupervised Stemmer for Arabic Tweets</title>
</titleInfo>
<name type="personal">
<namePart type="given">Fahad</namePart>
<namePart type="family">Albogamy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Allan</namePart>
<namePart type="family">Ramsay</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2016-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 2nd Workshop on Noisy User-generated Text (WNUT)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Bo</namePart>
<namePart type="family">Han</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Alan</namePart>
<namePart type="family">Ritter</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Leon</namePart>
<namePart type="family">Derczynski</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Wei</namePart>
<namePart type="family">Xu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tim</namePart>
<namePart type="family">Baldwin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>The COLING 2016 Organizing Committee</publisher>
<place>
<placeTerm type="text">Osaka, Japan</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Stemming is an essential processing step in a wide range of high level text processing applications such as information extraction, machine translation and sentiment analysis. It is used to reduce words to their stems. Many stemming algorithms have been developed for Modern Standard Arabic (MSA). Although Arabic tweets and MSA are closely related and share many characteristics, there are substantial differences between them in lexicon and syntax. In this paper, we introduce a light Arabic stemmer for Arabic tweets. Our results show improvements over the performance of a number of well-known stemmers for Arabic.</abstract>
<identifier type="citekey">albogamy-ramsay-2016-unsupervised</identifier>
<location>
<url>https://aclanthology.org/W16-3912</url>
</location>
<part>
<date>2016-12</date>
<extent unit="page">
<start>78</start>
<end>84</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Unsupervised Stemmer for Arabic Tweets
%A Albogamy, Fahad
%A Ramsay, Allan
%Y Han, Bo
%Y Ritter, Alan
%Y Derczynski, Leon
%Y Xu, Wei
%Y Baldwin, Tim
%S Proceedings of the 2nd Workshop on Noisy User-generated Text (WNUT)
%D 2016
%8 December
%I The COLING 2016 Organizing Committee
%C Osaka, Japan
%F albogamy-ramsay-2016-unsupervised
%X Stemming is an essential processing step in a wide range of high level text processing applications such as information extraction, machine translation and sentiment analysis. It is used to reduce words to their stems. Many stemming algorithms have been developed for Modern Standard Arabic (MSA). Although Arabic tweets and MSA are closely related and share many characteristics, there are substantial differences between them in lexicon and syntax. In this paper, we introduce a light Arabic stemmer for Arabic tweets. Our results show improvements over the performance of a number of well-known stemmers for Arabic.
%U https://aclanthology.org/W16-3912
%P 78-84
Markdown (Informal)
[Unsupervised Stemmer for Arabic Tweets](https://aclanthology.org/W16-3912) (Albogamy & Ramsay, WNUT 2016)
ACL
- Fahad Albogamy and Allan Ramsay. 2016. Unsupervised Stemmer for Arabic Tweets. In Proceedings of the 2nd Workshop on Noisy User-generated Text (WNUT), pages 78–84, Osaka, Japan. The COLING 2016 Organizing Committee.