@inproceedings{desilets-2010-webitext,
title = "{W}e{B}i{T}ext: Multilingual Concordancer Built from Public High Quality Web Content",
author = "D{\'e}silets, Alain",
booktitle = "Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program",
month = oct # " 31-" # nov # " 4",
year = "2010",
address = "Denver, Colorado, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2010.amta-government.13",
abstract = "In this paper, we describe WeBiText (www.webitext.ca) and how it is being used. WeBiText is a concordancer that allows translators to search in large, high-quality multilingual web sites, in order to find solutions to translation problems. After a quick overview of the system, we present results from an analysis of its logs, which provides a picture of how the tool is being used and how well it performs. We show that it is mostly used to find solutions for short, two or three word translation problems. The system produces at least one hit for 58{\%} of the queries, and hits from at least five different web pages in 41{\%} of cases. We show that 36{\%} of the queries correspond to specialized language problems, which is much higher than what was previously reported for a similar concordancer based on the Canadian Hansard (TransSearch). We also provide a back of the envelope calculation of the current economic impact of the tool, which we estimate at {\$}1 million per year, and growing rapidly.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="desilets-2010-webitext">
<titleInfo>
<title>WeBiText: Multilingual Concordancer Built from Public High Quality Web Content</title>
</titleInfo>
<name type="personal">
<namePart type="given">Alain</namePart>
<namePart type="family">Désilets</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued encoding="w3cdtf" point="start">2010-10-31</dateIssued>
<dateIssued encoding="w3cdtf" point="end">2010-11-04</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program</title>
</titleInfo>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">Denver, Colorado, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we describe WeBiText (www.webitext.ca) and how it is being used. WeBiText is a concordancer that allows translators to search in large, high-quality multilingual web sites, in order to find solutions to translation problems. After a quick overview of the system, we present results from an analysis of its logs, which provides a picture of how the tool is being used and how well it performs. We show that it is mostly used to find solutions for short, two or three word translation problems. The system produces at least one hit for 58% of the queries, and hits from at least five different web pages in 41% of cases. We show that 36% of the queries correspond to specialized language problems, which is much higher than what was previously reported for a similar concordancer based on the Canadian Hansard (TransSearch). We also provide a back of the envelope calculation of the current economic impact of the tool, which we estimate at $1 million per year, and growing rapidly.</abstract>
<identifier type="citekey">desilets-2010-webitext</identifier>
<location>
<url>https://aclanthology.org/2010.amta-government.13</url>
</location>
<part>
<date encoding="w3cdtf" point="start">2010-10-31</date>
<date encoding="w3cdtf" point="end">2010-11-04</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T WeBiText: Multilingual Concordancer Built from Public High Quality Web Content
%A Désilets, Alain
%S Proceedings of the 9th Conference of the Association for Machine Translation in the Americas: Government MT User Program
%D 2010
%8 October 31-November 4
%I Association for Machine Translation in the Americas
%C Denver, Colorado, USA
%F desilets-2010-webitext
%X In this paper, we describe WeBiText (www.webitext.ca) and how it is being used. WeBiText is a concordancer that allows translators to search in large, high-quality multilingual web sites, in order to find solutions to translation problems. After a quick overview of the system, we present results from an analysis of its logs, which provides a picture of how the tool is being used and how well it performs. We show that it is mostly used to find solutions for short, two or three word translation problems. The system produces at least one hit for 58% of the queries, and hits from at least five different web pages in 41% of cases. We show that 36% of the queries correspond to specialized language problems, which is much higher than what was previously reported for a similar concordancer based on the Canadian Hansard (TransSearch). We also provide a back of the envelope calculation of the current economic impact of the tool, which we estimate at $1 million per year, and growing rapidly.
%U https://aclanthology.org/2010.amta-government.13
Markdown (Informal)
[WeBiText: Multilingual Concordancer Built from Public High Quality Web Content](https://aclanthology.org/2010.amta-government.13) (Désilets, AMTA 2010)
ACL