@inproceedings{yerastov-2025-modeling,
title = "Modeling Constructional Prototypes with Sentence-{BERT}",
author = "Yerastov, Yuri V.",
editor = "Bonial, Claire and
Torgbi, Melissa and
Weissweiler, Leonie and
Blodgett, Austin and
Beuls, Katrien and
Van Eecke, Paul and
Tayyar Madabushi, Harish",
booktitle = "Proceedings of the Second International Workshop on Construction Grammars and NLP",
month = sep,
year = "2025",
address = {D{\"u}sseldorf, Germany},
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2025.cxgsnlp-1.3/",
pages = "24--33",
ISBN = "979-8-89176-318-0",
abstract = "This paper applies Sentence-Bert embeddings to the analysis of three competing constructions in Canadian English: \textit{be} perfect, predicate adjective and \textit{have} perfect. Samples are drawn from a Canadian news media database. Constructional exemplars are vectorized and mean-pooled to create constructional centroids, from which top-ranked exemplars and cross-construction similarities are calculated. Clause type distribution and definiteness marking are also examined. The embeddings-based analysis is cross-validated by a traditional quantitative study, and both lines of inquiry converge on the following tendencies: (1) prevalence of embedded {--} and particularly adverbial {--} clauses in the \textit{be} perfect and predicate adjective constructions, (2) prevalence of matrix clauses in the \textit{have} perfect, (3) prevalence of definiteness marking in the direct object of the \textit{be} perfect, and (4) greater statistical similarities between \textit{be} perfects and predicate adjectives. These findings support the argument that \textit{be} perfects function as topic-marking constructions within a usage-based framework."
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="yerastov-2025-modeling">
<titleInfo>
<title>Modeling Constructional Prototypes with Sentence-BERT</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yuri</namePart>
<namePart type="given">V</namePart>
<namePart type="family">Yerastov</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2025-09</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Second International Workshop on Construction Grammars and NLP</title>
</titleInfo>
<name type="personal">
<namePart type="given">Claire</namePart>
<namePart type="family">Bonial</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Melissa</namePart>
<namePart type="family">Torgbi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Leonie</namePart>
<namePart type="family">Weissweiler</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Austin</namePart>
<namePart type="family">Blodgett</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Katrien</namePart>
<namePart type="family">Beuls</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Paul</namePart>
<namePart type="family">Van Eecke</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Harish</namePart>
<namePart type="family">Tayyar Madabushi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Düsseldorf, Germany</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-318-0</identifier>
</relatedItem>
<abstract>This paper applies Sentence-Bert embeddings to the analysis of three competing constructions in Canadian English: be perfect, predicate adjective and have perfect. Samples are drawn from a Canadian news media database. Constructional exemplars are vectorized and mean-pooled to create constructional centroids, from which top-ranked exemplars and cross-construction similarities are calculated. Clause type distribution and definiteness marking are also examined. The embeddings-based analysis is cross-validated by a traditional quantitative study, and both lines of inquiry converge on the following tendencies: (1) prevalence of embedded – and particularly adverbial – clauses in the be perfect and predicate adjective constructions, (2) prevalence of matrix clauses in the have perfect, (3) prevalence of definiteness marking in the direct object of the be perfect, and (4) greater statistical similarities between be perfects and predicate adjectives. These findings support the argument that be perfects function as topic-marking constructions within a usage-based framework.</abstract>
<identifier type="citekey">yerastov-2025-modeling</identifier>
<location>
<url>https://aclanthology.org/2025.cxgsnlp-1.3/</url>
</location>
<part>
<date>2025-09</date>
<extent unit="page">
<start>24</start>
<end>33</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Modeling Constructional Prototypes with Sentence-BERT
%A Yerastov, Yuri V.
%Y Bonial, Claire
%Y Torgbi, Melissa
%Y Weissweiler, Leonie
%Y Blodgett, Austin
%Y Beuls, Katrien
%Y Van Eecke, Paul
%Y Tayyar Madabushi, Harish
%S Proceedings of the Second International Workshop on Construction Grammars and NLP
%D 2025
%8 September
%I Association for Computational Linguistics
%C Düsseldorf, Germany
%@ 979-8-89176-318-0
%F yerastov-2025-modeling
%X This paper applies Sentence-Bert embeddings to the analysis of three competing constructions in Canadian English: be perfect, predicate adjective and have perfect. Samples are drawn from a Canadian news media database. Constructional exemplars are vectorized and mean-pooled to create constructional centroids, from which top-ranked exemplars and cross-construction similarities are calculated. Clause type distribution and definiteness marking are also examined. The embeddings-based analysis is cross-validated by a traditional quantitative study, and both lines of inquiry converge on the following tendencies: (1) prevalence of embedded – and particularly adverbial – clauses in the be perfect and predicate adjective constructions, (2) prevalence of matrix clauses in the have perfect, (3) prevalence of definiteness marking in the direct object of the be perfect, and (4) greater statistical similarities between be perfects and predicate adjectives. These findings support the argument that be perfects function as topic-marking constructions within a usage-based framework.
%U https://aclanthology.org/2025.cxgsnlp-1.3/
%P 24-33
Markdown (Informal)
[Modeling Constructional Prototypes with Sentence-BERT](https://aclanthology.org/2025.cxgsnlp-1.3/) (Yerastov, CxGsNLP 2025)
ACL