% Journal article record (citation key krstev-etal-2025-light), as exported by the ACL Anthology.
% Values are brace-delimited; month uses the predefined jul macro; doi is stored bare (no resolver prefix).
% NOTE(review): editor, address and publisher are not standard fields of the classic article type,
% so some bibliography styles may not print them -- confirm against the target style.
@article{krstev-etal-2025-light,
  title     = {Light Verb Constructions in {ELEXIS-WSD} {--} Annotation, Comparisons and Issues},
  author    = {Krstev, Cvetana and
               Stankovi{\'c}, Ranka and
               Markovi{\'c}, Aleksandra},
  editor    = {Koeva, Svetla},
  journal   = {Journal Computational Linguistics in Bulgaria},
  volume    = {1},
  month     = jul,
  year      = {2025},
  address   = {Sofia, Bulgaria},
  publisher = {Institute for Bulgarian Language, Department of Computational Linguistics, Bulgarian Academy of Sciences},
  url       = {https://aclanthology.org/2025.jclib-1.3/},
  doi       = {10.47810/JCLIB.1.2025.03},
  pages     = {42--60},
  abstract  = {This paper deals with light verb constructions and their annotation in ELEXIS-sr, the Serbian extension of the ELEXIS-WSD corpus. In Section 1, general introductory remarks are given about these constructions, the notion of light verbs, and their treatment and further classification in the PARSEME annotation guidelines (subtypes LVC.full and LVC.cause). Section 2 offers an insight into ELEXIS-WSD corpus, annotated with VMWEs for several languages, with a remark that these VMWEs were not further subcategorised into finer classes. For this paper, we classified them ourselves to facilitate comparisons of the LVCs annotated in ELEXIS-sr. Tools and resources used for the automatic annotation of ELEXIS-sr are presented in Section 3, as well as the results of manual checking. In Section 4, we offer a comparison of LVCs in four ELEXIS-WSD sub-collections: Serbian, Bulgarian, Slovene, and English. We use Serbian as a starting point for this comparison, as it has been thoroughly annotated with MWEs (and NEs). We present the results of the comparison of all the occurrences of LVCs in the Serbian extension with their occurrences and annotation both in ELEXIS-WSD and Parseme sub-corpora for other languages. An important conclusion is that the most equivalents among LVCs are between Serbian and Bulgarian, closely related Slavic languages (a total of 34 equivalents), while between Serbian and Slovene, also Slavic, there are 11 equivalents, as between Serbian and English. It seems that this could be explained by the number of VMWES and LVCs annotated, or by the strategy used by different annotators.}
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- Single MODS record; its ID matches the citekey identifier further down. -->
  <mods ID="krstev-etal-2025-light">
    <titleInfo>
      <title>Light Verb Constructions in ELEXIS-WSD – Annotation, Comparisons and Issues</title>
    </titleInfo>

    <!-- Authors, in the order they are listed. -->
    <name type="personal">
      <namePart type="given">Cvetana</namePart>
      <namePart type="family">Krstev</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Ranka</namePart>
      <namePart type="family">Stanković</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Aleksandra</namePart>
      <namePart type="family">Marković</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>

    <originInfo>
      <dateIssued>2025-07</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <genre authority="bibutilsgt">journal article</genre>

    <!-- Host item: the journal in which the article appeared. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Journal Computational Linguistics in Bulgaria</title>
      </titleInfo>
      <originInfo>
        <issuance>continuing</issuance>
        <publisher>Institute for Bulgarian Language, Department of Computational Linguistics, Bulgarian Academy of Sciences</publisher>
        <place>
          <placeTerm type="text">Sofia, Bulgaria</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">periodical</genre>
      <genre authority="bibutilsgt">academic journal</genre>
    </relatedItem>

    <abstract>This paper deals with light verb constructions and their annotation in ELEXIS-sr, the Serbian extension of the ELEXIS-WSD corpus. In Section 1, general introductory remarks are given about these constructions, the notion of light verbs, and their treatment and further classification in the PARSEME annotation guidelines (subtypes LVC.full and LVC.cause). Section 2 offers an insight into ELEXIS-WSD corpus, annotated with VMWEs for several languages, with a remark that these VMWEs were not further subcategorised into finer classes. For this paper, we classified them ourselves to facilitate comparisons of the LVCs annotated in ELEXIS-sr. Tools and resources used for the automatic annotation of ELEXIS-sr are presented in Section 3, as well as the results of manual checking. In Section 4, we offer a comparison of LVCs in four ELEXIS-WSD sub-collections: Serbian, Bulgarian, Slovene, and English. We use Serbian as a starting point for this comparison, as it has been thoroughly annotated with MWEs (and NEs). We present the results of the comparison of all the occurrences of LVCs in the Serbian extension with their occurrences and annotation both in ELEXIS-WSD and Parseme sub-corpora for other languages. An important conclusion is that the most equivalents among LVCs are between Serbian and Bulgarian, closely related Slavic languages (a total of 34 equivalents), while between Serbian and Slovene, also Slavic, there are 11 equivalents, as between Serbian and English. It seems that this could be explained by the number of VMWES and LVCs annotated, or by the strategy used by different annotators.</abstract>

    <!-- Identifiers and access location. -->
    <identifier type="citekey">krstev-etal-2025-light</identifier>
    <identifier type="doi">10.47810/JCLIB.1.2025.03</identifier>
    <location>
      <url>https://aclanthology.org/2025.jclib-1.3/</url>
    </location>

    <!-- Position within the host: issue date, volume number and page range. -->
    <part>
      <date>2025-07</date>
      <detail type="volume">
        <number>1</number>
      </detail>
      <extent unit="page">
        <start>42</start>
        <end>60</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Journal Article
%T Light Verb Constructions in ELEXIS-WSD – Annotation, Comparisons and Issues
%A Krstev, Cvetana
%A Stanković, Ranka
%A Marković, Aleksandra
%J Journal Computational Linguistics in Bulgaria
%D 2025
%8 July
%V 1
%I Institute for Bulgarian Language, Department of Computational Linguistics, Bulgarian Academy of Sciences
%C Sofia, Bulgaria
%F krstev-etal-2025-light
%X This paper deals with light verb constructions and their annotation in ELEXIS-sr, the Serbian extension of the ELEXIS-WSD corpus. In Section 1, general introductory remarks are given about these constructions, the notion of light verbs, and their treatment and further classification in the PARSEME annotation guidelines (subtypes LVC.full and LVC.cause). Section 2 offers an insight into ELEXIS-WSD corpus, annotated with VMWEs for several languages, with a remark that these VMWEs were not further subcategorised into finer classes. For this paper, we classified them ourselves to facilitate comparisons of the LVCs annotated in ELEXIS-sr. Tools and resources used for the automatic annotation of ELEXIS-sr are presented in Section 3, as well as the results of manual checking. In Section 4, we offer a comparison of LVCs in four ELEXIS-WSD sub-collections: Serbian, Bulgarian, Slovene, and English. We use Serbian as a starting point for this comparison, as it has been thoroughly annotated with MWEs (and NEs). We present the results of the comparison of all the occurrences of LVCs in the Serbian extension with their occurrences and annotation both in ELEXIS-WSD and Parseme sub-corpora for other languages. An important conclusion is that the most equivalents among LVCs are between Serbian and Bulgarian, closely related Slavic languages (a total of 34 equivalents), while between Serbian and Slovene, also Slavic, there are 11 equivalents, as between Serbian and English. It seems that this could be explained by the number of VMWES and LVCs annotated, or by the strategy used by different annotators.
%R 10.47810/JCLIB.1.2025.03
%U https://aclanthology.org/2025.jclib-1.3/
%U https://doi.org/10.47810/JCLIB.1.2025.03
%P 42-60
Markdown (Informal)
[Light Verb Constructions in ELEXIS-WSD – Annotation, Comparisons and Issues](https://aclanthology.org/2025.jclib-1.3/) (Krstev et al., JCLIB 2025)
ACL