% Conference poster paper; the record is hosted on the ACL Anthology (see the url field).
% Accented letters are written as brace-wrapped LaTeX escapes so that classic
% 8-bit BibTeX treats each one as a single letter.
@inproceedings{thanopoulos-etal-2003-text,
  author    = {Thanopoulos, Aristomenis and Fakotakis, Nikos and Kokkinakis, George},
  title     = {Text Tokenization for Knowledge-free Automatic Extraction of Lexical Similarities},
  editor    = {Daille, B{\'e}atrice and Morin, Emmanuel},
  booktitle = {Actes de la 10{\`e}me conf{\'e}rence sur le Traitement Automatique des Langues Naturelles. Posters},
  pages     = {397--402},
  publisher = {ATALA},
  address   = {Batz-sur-Mer, France},
  month     = jun,
  year      = {2003},
  url       = {https://aclanthology.org/2003.jeptalnrecital-poster.17},
  abstract  = {Previous studies on automatic extraction of lexical similarities have considered as semantic unit of text the word. However, the theory of contextual lexical semantics implies that larger segments of text, namely non-compositional multiwords, are more appropriate for this role. We experimentally tested the applicability of this notion applying automatic collocation extraction to identify and merge such multiwords prior to the similarity estimation process. Employing an automatic WordNet-based comparative evaluation scheme along with a manual evaluation procedure, we ascertain improvement of the extracted similarity relations.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 rendering of the citation with key thanopoulos-etal-2003-text. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="thanopoulos-etal-2003-text">
    <!-- Title of the paper itself -->
    <titleInfo>
      <title>Text Tokenization for Knowledge-free Automatic Extraction of Lexical Similarities</title>
    </titleInfo>
    <!-- Authors: one <name> element per person -->
    <name type="personal">
      <namePart type="given">Aristomenis</namePart>
      <namePart type="family">Thanopoulos</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Nikos</namePart>
      <namePart type="family">Fakotakis</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">George</namePart>
      <namePart type="family">Kokkinakis</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2003-06</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host publication: the proceedings volume with its editors, publisher and place -->
    <relatedItem type="host">
      <titleInfo>
        <title>Actes de la 10ème conférence sur le Traitement Automatique des Langues Naturelles. Posters</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Béatrice</namePart>
        <namePart type="family">Daille</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Emmanuel</namePart>
        <namePart type="family">Morin</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>ATALA</publisher>
        <place>
          <placeTerm type="text">Batz-sur-Mer, France</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>Previous studies on automatic extraction of lexical similarities have considered as semantic unit of text the word. However, the theory of contextual lexical semantics implies that larger segments of text, namely non-compositional multiwords, are more appropriate for this role. We experimentally tested the applicability of this notion applying automatic collocation extraction to identify and merge such multiwords prior to the similarity estimation process. Employing an automatic WordNet-based comparative evaluation scheme along with a manual evaluation procedure, we ascertain improvement of the extracted similarity relations.</abstract>
    <identifier type="citekey">thanopoulos-etal-2003-text</identifier>
    <location>
      <url>https://aclanthology.org/2003.jeptalnrecital-poster.17</url>
    </location>
    <!-- Issue date and page range of the paper -->
    <part>
      <date>2003-06</date>
      <extent unit="page">
        <start>397</start>
        <end>402</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Text Tokenization for Knowledge-free Automatic Extraction of Lexical Similarities
%A Thanopoulos, Aristomenis
%A Fakotakis, Nikos
%A Kokkinakis, George
%Y Daille, Béatrice
%Y Morin, Emmanuel
%S Actes de la 10ème conférence sur le Traitement Automatique des Langues Naturelles. Posters
%D 2003
%8 June
%I ATALA
%C Batz-sur-Mer, France
%F thanopoulos-etal-2003-text
%X Previous studies on automatic extraction of lexical similarities have considered as semantic unit of text the word. However, the theory of contextual lexical semantics implies that larger segments of text, namely non-compositional multiwords, are more appropriate for this role. We experimentally tested the applicability of this notion applying automatic collocation extraction to identify and merge such multiwords prior to the similarity estimation process. Employing an automatic WordNet-based comparative evaluation scheme along with a manual evaluation procedure, we ascertain improvement of the extracted similarity relations.
%U https://aclanthology.org/2003.jeptalnrecital-poster.17
%P 397-402
Markdown (Informal)
[Text Tokenization for Knowledge-free Automatic Extraction of Lexical Similarities](https://aclanthology.org/2003.jeptalnrecital-poster.17) (Thanopoulos et al., JEP/TALN/RECITAL 2003)
ACL