@inproceedings{koloski-etal-2021-interesting,
title = "Interesting cross-border news discovery using cross-lingual article linking and document similarity",
author = "Koloski, Boshko and
Zosa, Elaine and
Stepi{\v{s}}nik-Perdih, Timen and
{\v{S}}krlj, Bla{\v{z}} and
Paju, Tarmo and
Pollak, Senja",
editor = "Toivonen, Hannu and
Boggia, Michele",
booktitle = "Proceedings of the EACL Hackashop on News Media Content Analysis and Automated Report Generation",
month = apr,
year = "2021",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2021.hackashop-1.16",
pages = "116--120",
abstract = "Team Name: team-8; Embeddia Tool: Cross-Lingual Document Retrieval Zosa et al.; Dataset: Estonian and Latvian news datasets. Abstract: Contemporary news media face increasing amounts of available data that can be of use when prioritizing, selecting and discovering new news. In this work we propose a methodology for retrieving interesting articles in a cross-border news discovery setting. More specifically, we explore how a set of seed documents in Estonian can be projected into the Latvian document space and serve as a basis for the discovery of novel interesting pieces of Latvian news that would interest Estonian readers. The proposed methodology was evaluated by an Estonian journalist, who confirmed that in the best setting, half of the top 10 retrieved Latvian documents represent news that is potentially interesting enough to be taken up by the Estonian media house and presented to Estonian readers.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="koloski-etal-2021-interesting">
<titleInfo>
<title>Interesting cross-border news discovery using cross-lingual article linking and document similarity</title>
</titleInfo>
<name type="personal">
<namePart type="given">Boshko</namePart>
<namePart type="family">Koloski</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Elaine</namePart>
<namePart type="family">Zosa</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Timen</namePart>
<namePart type="family">Stepišnik-Perdih</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Blaž</namePart>
<namePart type="family">Škrlj</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tarmo</namePart>
<namePart type="family">Paju</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Senja</namePart>
<namePart type="family">Pollak</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021-04</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the EACL Hackashop on News Media Content Analysis and Automated Report Generation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Hannu</namePart>
<namePart type="family">Toivonen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Michele</namePart>
<namePart type="family">Boggia</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Team Name: team-8; Embeddia Tool: Cross-Lingual Document Retrieval Zosa et al.; Dataset: Estonian and Latvian news datasets. Abstract: Contemporary news media face increasing amounts of available data that can be of use when prioritizing, selecting and discovering new news. In this work we propose a methodology for retrieving interesting articles in a cross-border news discovery setting. More specifically, we explore how a set of seed documents in Estonian can be projected into the Latvian document space and serve as a basis for the discovery of novel interesting pieces of Latvian news that would interest Estonian readers. The proposed methodology was evaluated by an Estonian journalist, who confirmed that in the best setting, half of the top 10 retrieved Latvian documents represent news that is potentially interesting enough to be taken up by the Estonian media house and presented to Estonian readers.</abstract>
<identifier type="citekey">koloski-etal-2021-interesting</identifier>
<location>
<url>https://aclanthology.org/2021.hackashop-1.16</url>
</location>
<part>
<date>2021-04</date>
<extent unit="page">
<start>116</start>
<end>120</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Interesting cross-border news discovery using cross-lingual article linking and document similarity
%A Koloski, Boshko
%A Zosa, Elaine
%A Stepišnik-Perdih, Timen
%A Škrlj, Blaž
%A Paju, Tarmo
%A Pollak, Senja
%Y Toivonen, Hannu
%Y Boggia, Michele
%S Proceedings of the EACL Hackashop on News Media Content Analysis and Automated Report Generation
%D 2021
%8 April
%I Association for Computational Linguistics
%C Online
%F koloski-etal-2021-interesting
%X Team Name: team-8; Embeddia Tool: Cross-Lingual Document Retrieval Zosa et al.; Dataset: Estonian and Latvian news datasets. Abstract: Contemporary news media face increasing amounts of available data that can be of use when prioritizing, selecting and discovering new news. In this work we propose a methodology for retrieving interesting articles in a cross-border news discovery setting. More specifically, we explore how a set of seed documents in Estonian can be projected into the Latvian document space and serve as a basis for the discovery of novel interesting pieces of Latvian news that would interest Estonian readers. The proposed methodology was evaluated by an Estonian journalist, who confirmed that in the best setting, half of the top 10 retrieved Latvian documents represent news that is potentially interesting enough to be taken up by the Estonian media house and presented to Estonian readers.
%U https://aclanthology.org/2021.hackashop-1.16
%P 116-120
Markdown (Informal)
[Interesting cross-border news discovery using cross-lingual article linking and document similarity](https://aclanthology.org/2021.hackashop-1.16) (Koloski et al., Hackashop 2021)
ACL