% Scherrer and Rabus, VarDial 2017 workshop paper on morphosyntactic tagging for spoken Rusyn.
% Percent signs in the abstract are escaped so the field is safe if a style typesets it.
@InProceedings{scherrer-rabus:2017:VarDial,
  author    = {Scherrer, Yves and Rabus, Achim},
  title     = {Multi-source morphosyntactic tagging for spoken {Rusyn}},
  booktitle = {Proceedings of the Fourth Workshop on {NLP} for Similar Languages, Varieties and Dialects ({VarDial})},
  month     = apr,
  year      = {2017},
  address   = {Valencia, Spain},
  publisher = {Association for Computational Linguistics},
  pages     = {84--92},
  abstract  = {This paper deals with the development of morphosyntactic taggers for spoken
               varieties of the Slavic minority language Rusyn. As neither annotated corpora
               nor parallel corpora are electronically available for Rusyn, we propose to
               combine existing resources from the etymologically close Slavic languages
               Russian, Ukrainian, Slovak, and Polish and adapt them to Rusyn. Using MarMoT as
               tagging toolkit, we show that a tagger trained on a balanced set of the four
               source languages outperforms single language taggers by about 9\%, and that
               additional automatically induced morphosyntactic lexicons lead to further
               improvements. The best observed accuracies for Rusyn are 82.4\% for
               part-of-speech tagging and 75.5\% for full morphological tagging.},
  url       = {http://www.aclweb.org/anthology/W17-1210},
}

