% Workshop paper (LT4DH at COLING 2016). The month uses the standard BibTeX
% macro so the bibliography style controls its rendering; acronyms are
% brace-protected so that styles which recase fields keep their capitals.
@InProceedings{raganato-EtAl:2016:LT4DH,
  author    = {Raganato, Alessandro and Camacho-Collados, Jose and Raganato, Antonio and Joung, Yunseo},
  title     = {Semantic Indexing of Multilingual Corpora and its Application on the History Domain},
  booktitle = {Proceedings of the Workshop on Language Technology Resources and Tools for Digital Humanities ({LT4DH})},
  month     = dec,
  year      = {2016},
  address   = {Osaka, Japan},
  publisher = {The {COLING} 2016 Organizing Committee},
  pages     = {140--147},
  abstract  = {The increasing amount of multilingual text collections available in different
	domains makes its automatic processing essential for the development of a given
	field. However, standard processing techniques based on statistical clues and
	keyword searches have clear limitations. Instead, we propose a knowledge-based
	processing pipeline which overcomes most of the limitations of these
	techniques. This, in turn, enables direct comparison across texts in different
	languages without the need of translation. In this paper we show the potential
	of this approach for semantically indexing multilingual text collections in the
	history domain. In our experiments we used a version of the Bible translated in
	four different languages, evaluating the precision of our semantic indexing
	pipeline and showing its reliability on the cross-lingual text retrieval task.},
  url       = {http://aclweb.org/anthology/W16-4019}
}

