% Chernyak (2017): BSNLP workshop paper comparing string similarity measures
% for filtering obscene lexis in Russian texts (ACL Anthology W17-1415).
@InProceedings{chernyak:2017:BSNLP,
  author    = {Chernyak, Ekaterina},
  title     = {Comparison of String Similarity Measures for Obscenity Filtering},
  booktitle = {Proceedings of the 6th Workshop on Balto-Slavic Natural Language Processing},
  month     = apr,
  year      = {2017},
  address   = {Valencia, Spain},
  publisher = {Association for Computational Linguistics},
  pages     = {97--101},
  abstract  = {In this paper we address the problem of filtering obscene lexis in Russian
               texts. We use string similarity measures to find words similar or identical to
               words from a stop list and establish both a test collection and a baseline for
               the task. Our experiments show that a novel string similarity measure based on
               the notion of an annotated suffix tree outperforms some of the other well known
               measures.},
  url       = {http://www.aclweb.org/anthology/W17-1415}
}

