@inproceedings{zhang-tan-2021-textual,
title = "Textual Representations for Crosslingual Information Retrieval",
author = "Zhang, Hang and
Tan, Liling",
booktitle = "Proceedings of the 4th Workshop on e-Commerce and NLP",
month = aug,
year = "2021",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2021.ecnlp-1.14",
doi = "10.18653/v1/2021.ecnlp-1.14",
pages = "116--122",
abstract = "In this paper, we explored different levels of textual representations for cross-lingual information retrieval. Beyond the traditional token level representation, we adopted the subword and character level representations for information retrieval that had shown to improve neural machine translation by reducing the out-of-vocabulary issues in machine translation. We found that crosslingual information retrieval performance can be improved by combining search results from subwords and token level representation. Additionally, we improved the search performance by combining and re-ranking the result sets from the different text representations for German, French and Japanese.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="zhang-tan-2021-textual">
<titleInfo>
<title>Textual Representations for Crosslingual Information Retrieval</title>
</titleInfo>
<name type="personal">
<namePart type="given">Hang</namePart>
<namePart type="family">Zhang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Liling</namePart>
<namePart type="family">Tan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021-08</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 4th Workshop on e-Commerce and NLP</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we explored different levels of textual representations for cross-lingual information retrieval. Beyond the traditional token level representation, we adopted the subword and character level representations for information retrieval that had shown to improve neural machine translation by reducing the out-of-vocabulary issues in machine translation. We found that crosslingual information retrieval performance can be improved by combining search results from subwords and token level representation. Additionally, we improved the search performance by combining and re-ranking the result sets from the different text representations for German, French and Japanese.</abstract>
<identifier type="citekey">zhang-tan-2021-textual</identifier>
<identifier type="doi">10.18653/v1/2021.ecnlp-1.14</identifier>
<location>
<url>https://aclanthology.org/2021.ecnlp-1.14</url>
</location>
<part>
<date>2021-08</date>
<extent unit="page">
<start>116</start>
<end>122</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Textual Representations for Crosslingual Information Retrieval
%A Zhang, Hang
%A Tan, Liling
%S Proceedings of the 4th Workshop on e-Commerce and NLP
%D 2021
%8 August
%I Association for Computational Linguistics
%C Online
%F zhang-tan-2021-textual
%X In this paper, we explored different levels of textual representations for cross-lingual information retrieval. Beyond the traditional token level representation, we adopted the subword and character level representations for information retrieval that had shown to improve neural machine translation by reducing the out-of-vocabulary issues in machine translation. We found that crosslingual information retrieval performance can be improved by combining search results from subwords and token level representation. Additionally, we improved the search performance by combining and re-ranking the result sets from the different text representations for German, French and Japanese.
%R 10.18653/v1/2021.ecnlp-1.14
%U https://aclanthology.org/2021.ecnlp-1.14
%U https://doi.org/10.18653/v1/2021.ecnlp-1.14
%P 116-122
Markdown (Informal)
[Textual Representations for Crosslingual Information Retrieval](https://aclanthology.org/2021.ecnlp-1.14) (Zhang & Tan, ECNLP 2021)
ACL