% Workshop paper (LaTeCH-CLfL 2017); ACL Anthology ID W17-2212.
% Accented letters use BibTeX "special character" form ({\'e}, {\^\i}) so that
% sorting and labels work; proper nouns/acronyms are brace-protected against
% style-driven recasing; month uses the predefined macro.
@InProceedings{walther-sagot:2017:LaTeCH-CLfL,
  author    = {Walther, G{\'e}raldine and Sagot, Beno{\^\i}t},
  title     = {Speeding up corpus development for linguistic research: language documentation and acquisition in {Romansh} {Tuatschin}},
  booktitle = {Proceedings of the Joint {SIGHUM} Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature},
  month     = aug,
  year      = {2017},
  address   = {Vancouver, Canada},
  publisher = {Association for Computational Linguistics},
  pages     = {89--94},
  abstract  = {In this paper, we present ongoing work for developing language resources and
	basic NLP tools for an undocumented variety of Romansh, in the context of a
	language documentation and language acquisition project. Our tools are meant to
	improve the speed and reliability of corpus annotations for noisy data
	involving large amounts of code-switching, occurrences of child-speech and
	orthographic noise. Being able to increase the efficiency of language resource
	development for language documentation and acquisition research also
	constitutes a step towards solving the data sparsity issues with which
	researchers have been struggling.},
  url       = {http://www.aclweb.org/anthology/W17-2212}
}

