% Rabus and Scherrer (2017): workshop paper on lexicon induction for spoken
% Rusyn, published in the BSNLP 2017 proceedings.
% - month uses the predefined macro so styles can abbreviate/localise it.
% - Proper nouns in the title are brace-protected against sentence casing.
% - Percent signs in the abstract are escaped so that styles which print the
%   abstract do not turn the rest of the line into a LaTeX comment.
% NOTE(review): address appears to hold the workshop venue rather than the
% publisher's city; kept as exported -- confirm against the file's convention.
@InProceedings{rabus-scherrer:2017:BSNLP,
  author    = {Rabus, Achim and Scherrer, Yves},
  title     = {Lexicon Induction for Spoken {Rusyn} -- Challenges and Results},
  booktitle = {Proceedings of the 6th Workshop on {Balto-Slavic} Natural Language Processing},
  month     = apr,
  year      = {2017},
  address   = {Valencia, Spain},
  publisher = {Association for Computational Linguistics},
  pages     = {27--32},
  abstract  = {This paper reports on challenges and results in developing NLP resources for
    spoken Rusyn. Being a Slavic minority language, Rusyn does not have any
    resources to make use of. We propose to build a morphosyntactic dictionary for
    Rusyn, combining existing resources from the etymologically close Slavic
    languages Russian, Ukrainian, Slovak, and Polish. We adapt these resources to
    Rusyn by using vowel-sensitive Levenshtein distance, hand-written
    language-specific transformation rules, and combinations of the two. Compared
    to an exact match baseline, we increase the coverage of the resulting
    morphological dictionary by up to 77.4\% relative (42.9\% absolute), which
    results in a tagging recall increased by 11.6\% relative (9.1\% absolute). Our
    research confirms and expands the results of previous studies showing the
    efficiency of using NLP resources from neighboring languages for low-resourced
    languages.},
  url       = {http://www.aclweb.org/anthology/W17-1405}
}

