% CogALex-V (COLING 2016 workshop) paper on Arabic lemmatization through patterns.
% Case-sensitive words in title/booktitle are brace-protected so sentence-casing
% styles keep them; month uses the predefined macro so styles can format it.
@InProceedings{attia-zirikly-diab:2016:CogALex-V,
  author    = {Attia, Mohammed and Zirikly, Ayah and Diab, Mona},
  title     = {The Power of Language Music: {Arabic} Lemmatization through Patterns},
  booktitle = {Proceedings of the 5th Workshop on Cognitive Aspects of the Lexicon ({CogALex} - {V})},
  month     = dec,
  year      = {2016},
  address   = {Osaka, Japan},
  publisher = {The COLING 2016 Organizing Committee},
  pages     = {40--50},
  abstract  = {The interaction between roots and patterns in Arabic has intrigued
	lexicographers and morphologists for centuries. While roots provide the
	consonantal building blocks, patterns provide the syllabic vocalic moulds.
	While roots provide abstract semantic classes, patterns realize these classes
	in specific instances. In this way both roots and patterns are indispensable
	for understanding the derivational, morphological and, to some extent, the
	cognitive aspects of the Arabic language. In this paper we perform
	lemmatization (a high-level lexical processing) without relying on a lookup
	dictionary. We use a hybrid approach that consists of a machine learning
	classifier to predict the lemma pattern for a given stem, and mapping rules to
	convert stems to their respective lemmas with the vocalization defined by the
	pattern.},
  url       = {http://aclweb.org/anthology/W16-5306}
}

