% EMNLP 2018 system-demonstration paper on the information extraction pipeline for New/s/leak 2.0.
% The month is given as the predefined macro (nov) so each style can abbreviate or localize it.
@InProceedings{wiedemann-yimam-biemann:2018:Demos,
  author    = {Wiedemann, Gregor and Yimam, Seid Muhie and Biemann, Chris},
  title     = {A Multilingual Information Extraction Pipeline for Investigative Journalism},
  booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing: System Demonstrations},
  month     = nov,
  year      = {2018},
  address   = {Brussels, Belgium},
  publisher = {Association for Computational Linguistics},
  pages     = {78--83},
  abstract  = {We introduce an advanced information extraction pipeline to automatically process very large collections of unstructured textual data for the purpose of investigative journalism. The pipeline serves as a new input processor for the upcoming major release of our New/s/leak 2.0 software, which we develop in cooperation with a large German news organization. The use case is that journalists receive a large collection of files up to several Gigabytes containing unknown contents. Collections may originate either from official disclosures of documents, e.g. Freedom of Information Act requests, or unofficial data leaks.},
  url       = {http://www.aclweb.org/anthology/D18-2014},
}

