@inproceedings{schaefer-etal-2022-selecting,
title = "On Selecting Training Corpora for Cross-Domain Claim Detection",
author = "Schaefer, Robin and
Knaebel, Ren{\'e} and
Stede, Manfred",
editor = "Lapesa, Gabriella and
Schneider, Jodi and
Jo, Yohan and
Saha, Sougata",
booktitle = "Proceedings of the 9th Workshop on Argument Mining",
month = oct,
year = "2022",
address = "Online and in Gyeongju, Republic of Korea",
publisher = "International Conference on Computational Linguistics",
url = "https://aclanthology.org/2022.argmining-1.17",
pages = "181--186",
abstract = "Identifying claims in text is a crucial first step in argument mining. In this paper, we investigate factors for the composition of training corpora to improve cross-domain claim detection. To this end, we use four recent argumentation corpora annotated with claims and submit them to several experimental scenarios. Our results indicate that the {``}ideal{''} composition of training corpora is characterized by a large corpus size, homogeneous claim proportions, and less formal text domains.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="schaefer-etal-2022-selecting">
<titleInfo>
<title>On Selecting Training Corpora for Cross-Domain Claim Detection</title>
</titleInfo>
<name type="personal">
<namePart type="given">Robin</namePart>
<namePart type="family">Schaefer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">René</namePart>
<namePart type="family">Knaebel</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Manfred</namePart>
<namePart type="family">Stede</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2022-10</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 9th Workshop on Argument Mining</title>
</titleInfo>
<name type="personal">
<namePart type="given">Gabriella</namePart>
<namePart type="family">Lapesa</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jodi</namePart>
<namePart type="family">Schneider</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yohan</namePart>
<namePart type="family">Jo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sougata</namePart>
<namePart type="family">Saha</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>International Conference on Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online and in Gyeongju, Republic of Korea</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Identifying claims in text is a crucial first step in argument mining. In this paper, we investigate factors for the composition of training corpora to improve cross-domain claim detection. To this end, we use four recent argumentation corpora annotated with claims and submit them to several experimental scenarios. Our results indicate that the “ideal” composition of training corpora is characterized by a large corpus size, homogeneous claim proportions, and less formal text domains.</abstract>
<identifier type="citekey">schaefer-etal-2022-selecting</identifier>
<location>
<url>https://aclanthology.org/2022.argmining-1.17</url>
</location>
<part>
<date>2022-10</date>
<extent unit="page">
<start>181</start>
<end>186</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T On Selecting Training Corpora for Cross-Domain Claim Detection
%A Schaefer, Robin
%A Knaebel, René
%A Stede, Manfred
%Y Lapesa, Gabriella
%Y Schneider, Jodi
%Y Jo, Yohan
%Y Saha, Sougata
%S Proceedings of the 9th Workshop on Argument Mining
%D 2022
%8 October
%I International Conference on Computational Linguistics
%C Online and in Gyeongju, Republic of Korea
%F schaefer-etal-2022-selecting
%X Identifying claims in text is a crucial first step in argument mining. In this paper, we investigate factors for the composition of training corpora to improve cross-domain claim detection. To this end, we use four recent argumentation corpora annotated with claims and submit them to several experimental scenarios. Our results indicate that the “ideal” composition of training corpora is characterized by a large corpus size, homogeneous claim proportions, and less formal text domains.
%U https://aclanthology.org/2022.argmining-1.17
%P 181-186
Markdown (Informal)
[On Selecting Training Corpora for Cross-Domain Claim Detection](https://aclanthology.org/2022.argmining-1.17) (Schaefer et al., ArgMining 2022)
ACL