% ACL Anthology record W18-2508: workshop paper in the NLP-OSS 2018 proceedings.
@inproceedings{germann-etal-2018-integrating,
  author    = {Germann, Ulrich and
               Liepins, Ren{\=a}rs and
               Gosko, Didzis and
               Barzdins, Guntis},
  title     = {Integrating Multiple {NLP} Technologies into an Open-source Platform for Multilingual Media Monitoring},
  editor    = {Park, Eunjeong L. and
               Hagiwara, Masato and
               Milajevs, Dmitrijs and
               Tan, Liling},
  booktitle = {Proceedings of Workshop for {NLP} Open Source Software ({NLP}-{OSS})},
  month     = jul,
  year      = {2018},
  address   = {Melbourne, Australia},
  publisher = {Association for Computational Linguistics},
  pages     = {47--51},
  doi       = {10.18653/v1/W18-2508},
  url       = {https://aclanthology.org/W18-2508},
  abstract  = {The open-source SUMMA Platform is a highly scalable distributed architecture for monitoring a large number of media broadcasts in parallel, with a lag behind actual broadcast time of at most a few minutes. It assembles numerous state-of-the-art NLP technologies into a fully automated media ingestion pipeline that can record live broadcasts, detect and transcribe spoken content, translate from several languages (original text or transcribed speech) into English, recognize Named Entities, detect topics, cluster and summarize documents across language barriers, and extract and store factual claims in these news items. This paper describes the intended use cases and discusses the system design decisions that allowed us to integrate state-of-the-art NLP modules into an effective workflow with comparatively little effort.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 record for citekey germann-etal-2018-integrating: the paper itself, with its host proceedings described in the relatedItem element. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="germann-etal-2018-integrating">
    <titleInfo>
      <title>Integrating Multiple NLP Technologies into an Open-source Platform for Multilingual Media Monitoring</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Ulrich</namePart>
      <namePart type="family">Germann</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Renārs</namePart>
      <namePart type="family">Liepins</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Didzis</namePart>
      <namePart type="family">Gosko</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Guntis</namePart>
      <namePart type="family">Barzdins</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2018-07</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of Workshop for NLP Open Source Software (NLP-OSS)</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Eunjeong</namePart>
        <namePart type="given">L</namePart>
        <namePart type="family">Park</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Masato</namePart>
        <namePart type="family">Hagiwara</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Dmitrijs</namePart>
        <namePart type="family">Milajevs</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Liling</namePart>
        <namePart type="family">Tan</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">Melbourne, Australia</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>The open-source SUMMA Platform is a highly scalable distributed architecture for monitoring a large number of media broadcasts in parallel, with a lag behind actual broadcast time of at most a few minutes. It assembles numerous state-of-the-art NLP technologies into a fully automated media ingestion pipeline that can record live broadcasts, detect and transcribe spoken content, translate from several languages (original text or transcribed speech) into English, recognize Named Entities, detect topics, cluster and summarize documents across language barriers, and extract and store factual claims in these news items. This paper describes the intended use cases and discusses the system design decisions that allowed us to integrate state-of-the-art NLP modules into an effective workflow with comparatively little effort.</abstract>
    <identifier type="citekey">germann-etal-2018-integrating</identifier>
    <identifier type="doi">10.18653/v1/W18-2508</identifier>
    <location>
      <url>https://aclanthology.org/W18-2508</url>
    </location>
    <part>
      <date>2018-07</date>
      <extent unit="page">
        <start>47</start>
        <end>51</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Integrating Multiple NLP Technologies into an Open-source Platform for Multilingual Media Monitoring
%A Germann, Ulrich
%A Liepins, Renārs
%A Gosko, Didzis
%A Barzdins, Guntis
%Y Park, Eunjeong L.
%Y Hagiwara, Masato
%Y Milajevs, Dmitrijs
%Y Tan, Liling
%S Proceedings of Workshop for NLP Open Source Software (NLP-OSS)
%D 2018
%8 July
%I Association for Computational Linguistics
%C Melbourne, Australia
%F germann-etal-2018-integrating
%X The open-source SUMMA Platform is a highly scalable distributed architecture for monitoring a large number of media broadcasts in parallel, with a lag behind actual broadcast time of at most a few minutes. It assembles numerous state-of-the-art NLP technologies into a fully automated media ingestion pipeline that can record live broadcasts, detect and transcribe spoken content, translate from several languages (original text or transcribed speech) into English, recognize Named Entities, detect topics, cluster and summarize documents across language barriers, and extract and store factual claims in these news items. This paper describes the intended use cases and discusses the system design decisions that allowed us to integrate state-of-the-art NLP modules into an effective workflow with comparatively little effort.
%R 10.18653/v1/W18-2508
%U https://aclanthology.org/W18-2508
%U https://doi.org/10.18653/v1/W18-2508
%P 47-51
Markdown (Informal)
[Integrating Multiple NLP Technologies into an Open-source Platform for Multilingual Media Monitoring](https://aclanthology.org/W18-2508) (Germann et al., NLPOSS 2018)
ACL