@inproceedings{mccrae-2019-identification,
title = "Identification of Adjective-Noun Neologisms using Pretrained Language Models",
author = "McCrae, John Philip",
editor = "Savary, Agata and
Escart{\'\i}n, Carla Parra and
Bond, Francis and
Mitrovi{\'c}, Jelena and
Mititelu, Verginica Barbu",
booktitle = "Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)",
month = aug,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W19-5116",
doi = "10.18653/v1/W19-5116",
pages = "135--141",
abstract = "Neologism detection is a key task in the constructing of lexical resources and has wider implications for NLP, however the identification of multiword neologisms has received little attention. In this paper, we show that we can effectively identify the distinction between compositional and non-compositional adjective-noun pairs by using pretrained language models and comparing this with individual word embeddings. Our results show that the use of these models significantly improves over baseline linguistic features, however the combination with linguistic features still further improves the results, suggesting the strength of a hybrid approach.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="mccrae-2019-identification">
<titleInfo>
<title>Identification of Adjective-Noun Neologisms using Pretrained Language Models</title>
</titleInfo>
<name type="personal">
<namePart type="given">John</namePart>
<namePart type="given">Philip</namePart>
<namePart type="family">McCrae</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-08</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Agata</namePart>
<namePart type="family">Savary</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Carla</namePart>
<namePart type="given">Parra</namePart>
<namePart type="family">Escartín</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Francis</namePart>
<namePart type="family">Bond</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jelena</namePart>
<namePart type="family">Mitrović</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Verginica</namePart>
<namePart type="given">Barbu</namePart>
<namePart type="family">Mititelu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Florence, Italy</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Neologism detection is a key task in the constructing of lexical resources and has wider implications for NLP, however the identification of multiword neologisms has received little attention. In this paper, we show that we can effectively identify the distinction between compositional and non-compositional adjective-noun pairs by using pretrained language models and comparing this with individual word embeddings. Our results show that the use of these models significantly improves over baseline linguistic features, however the combination with linguistic features still further improves the results, suggesting the strength of a hybrid approach.</abstract>
<identifier type="citekey">mccrae-2019-identification</identifier>
<identifier type="doi">10.18653/v1/W19-5116</identifier>
<location>
<url>https://aclanthology.org/W19-5116</url>
</location>
<part>
<date>2019-08</date>
<extent unit="page">
<start>135</start>
<end>141</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Identification of Adjective-Noun Neologisms using Pretrained Language Models
%A McCrae, John Philip
%Y Savary, Agata
%Y Escartín, Carla Parra
%Y Bond, Francis
%Y Mitrović, Jelena
%Y Mititelu, Verginica Barbu
%S Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)
%D 2019
%8 August
%I Association for Computational Linguistics
%C Florence, Italy
%F mccrae-2019-identification
%X Neologism detection is a key task in the constructing of lexical resources and has wider implications for NLP, however the identification of multiword neologisms has received little attention. In this paper, we show that we can effectively identify the distinction between compositional and non-compositional adjective-noun pairs by using pretrained language models and comparing this with individual word embeddings. Our results show that the use of these models significantly improves over baseline linguistic features, however the combination with linguistic features still further improves the results, suggesting the strength of a hybrid approach.
%R 10.18653/v1/W19-5116
%U https://aclanthology.org/W19-5116
%U https://doi.org/10.18653/v1/W19-5116
%P 135-141
Markdown (Informal)
[Identification of Adjective-Noun Neologisms using Pretrained Language Models](https://aclanthology.org/W19-5116) (McCrae, MWE 2019)
ACL