@inproceedings{xu-etal-2019-treat,
title = "Treat the Word As a Whole or Look Inside? Subword Embeddings Model Language Change and Typology",
author = "Xu, Yang and
Zhang, Jiasheng and
Reitter, David",
editor = "Tahmasebi, Nina and
Borin, Lars and
Jatowt, Adam and
Xu, Yang",
booktitle = "Proceedings of the 1st International Workshop on Computational Approaches to Historical Language Change",
month = aug,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W19-4717",
doi = "10.18653/v1/W19-4717",
pages = "136--145",
abstract = "We use a variant of word embedding model that incorporates subword information to characterize the degree of compositionality in lexical semantics. Our models reveal some interesting yet contrastive patterns of long-term change in multiple languages: Indo-European languages put more weight on subword units in newer words, while conversely Chinese puts less weights on the subwords, but more weight on the word as a whole. Our method provides novel evidence and methodology that enriches existing theories in evolutionary linguistics. The resulting word vectors also has decent performance in NLP-related tasks.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="xu-etal-2019-treat">
<titleInfo>
<title>Treat the Word As a Whole or Look Inside? Subword Embeddings Model Language Change and Typology</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yang</namePart>
<namePart type="family">Xu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jiasheng</namePart>
<namePart type="family">Zhang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">David</namePart>
<namePart type="family">Reitter</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-08</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 1st International Workshop on Computational Approaches to Historical Language Change</title>
</titleInfo>
<name type="personal">
<namePart type="given">Nina</namePart>
<namePart type="family">Tahmasebi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Lars</namePart>
<namePart type="family">Borin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Adam</namePart>
<namePart type="family">Jatowt</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yang</namePart>
<namePart type="family">Xu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Florence, Italy</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>We use a variant of word embedding model that incorporates subword information to characterize the degree of compositionality in lexical semantics. Our models reveal some interesting yet contrastive patterns of long-term change in multiple languages: Indo-European languages put more weight on subword units in newer words, while conversely Chinese puts less weights on the subwords, but more weight on the word as a whole. Our method provides novel evidence and methodology that enriches existing theories in evolutionary linguistics. The resulting word vectors also has decent performance in NLP-related tasks.</abstract>
<identifier type="citekey">xu-etal-2019-treat</identifier>
<identifier type="doi">10.18653/v1/W19-4717</identifier>
<location>
<url>https://aclanthology.org/W19-4717</url>
</location>
<part>
<date>2019-08</date>
<extent unit="page">
<start>136</start>
<end>145</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Treat the Word As a Whole or Look Inside? Subword Embeddings Model Language Change and Typology
%A Xu, Yang
%A Zhang, Jiasheng
%A Reitter, David
%Y Tahmasebi, Nina
%Y Borin, Lars
%Y Jatowt, Adam
%Y Xu, Yang
%S Proceedings of the 1st International Workshop on Computational Approaches to Historical Language Change
%D 2019
%8 August
%I Association for Computational Linguistics
%C Florence, Italy
%F xu-etal-2019-treat
%X We use a variant of word embedding model that incorporates subword information to characterize the degree of compositionality in lexical semantics. Our models reveal some interesting yet contrastive patterns of long-term change in multiple languages: Indo-European languages put more weight on subword units in newer words, while conversely Chinese puts less weights on the subwords, but more weight on the word as a whole. Our method provides novel evidence and methodology that enriches existing theories in evolutionary linguistics. The resulting word vectors also has decent performance in NLP-related tasks.
%R 10.18653/v1/W19-4717
%U https://aclanthology.org/W19-4717
%U https://doi.org/10.18653/v1/W19-4717
%P 136-145
Markdown (Informal)
[Treat the Word As a Whole or Look Inside? Subword Embeddings Model Language Change and Typology](https://aclanthology.org/W19-4717) (Xu et al., LChange 2019)
ACL