@inproceedings{andresen-zinsmeister-2017-approximating,
title = "Approximating Style by N-gram-based Annotation",
author = "Andresen, Melanie and
Zinsmeister, Heike",
editor = "Brooke, Julian and
Solorio, Thamar and
Koppel, Moshe",
booktitle = "Proceedings of the Workshop on Stylistic Variation",
month = sep,
year = "2017",
address = "Copenhagen, Denmark",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W17-4913",
doi = "10.18653/v1/W17-4913",
pages = "105--115",
abstract = "The concept of style is much debated in theoretical as well as empirical terms. From an empirical perspective, the key question is how to operationalize style and thus make it accessible for annotation and quantification. In authorship attribution, many different approaches have successfully resolved this issue at the cost of linguistic interpretability: The resulting algorithms may be able to distinguish one language variety from the other, but do not give us much information on their distinctive linguistic properties. We approach the issue of interpreting stylistic features by extracting linear and syntactic n-grams that are distinctive for a language variety. We present a study that exemplifies this process by a comparison of the German academic languages of linguistics and literary studies. Overall, our findings show that distinctive n-grams can be related to linguistic categories. The results suggest that the style of German literary studies is characterized by nominal structures and the style of linguistics by verbal ones.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="andresen-zinsmeister-2017-approximating">
<titleInfo>
<title>Approximating Style by N-gram-based Annotation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Melanie</namePart>
<namePart type="family">Andresen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Heike</namePart>
<namePart type="family">Zinsmeister</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2017-09</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Workshop on Stylistic Variation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Julian</namePart>
<namePart type="family">Brooke</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Thamar</namePart>
<namePart type="family">Solorio</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Moshe</namePart>
<namePart type="family">Koppel</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Copenhagen, Denmark</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>The concept of style is much debated in theoretical as well as empirical terms. From an empirical perspective, the key question is how to operationalize style and thus make it accessible for annotation and quantification. In authorship attribution, many different approaches have successfully resolved this issue at the cost of linguistic interpretability: The resulting algorithms may be able to distinguish one language variety from the other, but do not give us much information on their distinctive linguistic properties. We approach the issue of interpreting stylistic features by extracting linear and syntactic n-grams that are distinctive for a language variety. We present a study that exemplifies this process by a comparison of the German academic languages of linguistics and literary studies. Overall, our findings show that distinctive n-grams can be related to linguistic categories. The results suggest that the style of German literary studies is characterized by nominal structures and the style of linguistics by verbal ones.</abstract>
<identifier type="citekey">andresen-zinsmeister-2017-approximating</identifier>
<identifier type="doi">10.18653/v1/W17-4913</identifier>
<location>
<url>https://aclanthology.org/W17-4913</url>
</location>
<part>
<date>2017-09</date>
<extent unit="page">
<start>105</start>
<end>115</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Approximating Style by N-gram-based Annotation
%A Andresen, Melanie
%A Zinsmeister, Heike
%Y Brooke, Julian
%Y Solorio, Thamar
%Y Koppel, Moshe
%S Proceedings of the Workshop on Stylistic Variation
%D 2017
%8 September
%I Association for Computational Linguistics
%C Copenhagen, Denmark
%F andresen-zinsmeister-2017-approximating
%X The concept of style is much debated in theoretical as well as empirical terms. From an empirical perspective, the key question is how to operationalize style and thus make it accessible for annotation and quantification. In authorship attribution, many different approaches have successfully resolved this issue at the cost of linguistic interpretability: The resulting algorithms may be able to distinguish one language variety from the other, but do not give us much information on their distinctive linguistic properties. We approach the issue of interpreting stylistic features by extracting linear and syntactic n-grams that are distinctive for a language variety. We present a study that exemplifies this process by a comparison of the German academic languages of linguistics and literary studies. Overall, our findings show that distinctive n-grams can be related to linguistic categories. The results suggest that the style of German literary studies is characterized by nominal structures and the style of linguistics by verbal ones.
%R 10.18653/v1/W17-4913
%U https://aclanthology.org/W17-4913
%U https://doi.org/10.18653/v1/W17-4913
%P 105-115
Markdown (Informal)
[Approximating Style by N-gram-based Annotation](https://aclanthology.org/W17-4913) (Andresen & Zinsmeister, Style-Var 2017)
ACL