% Workshop paper by Petra Steiner (2019), ACL Anthology record W19-4221.
% The proper noun "German" in the title is brace-protected as a whole word so
% that styles which sentence-case titles keep its capital letter.
% NOTE(review): address appears to hold the meeting location rather than the
% publisher's city; confirm this is what the target style expects.
@inproceedings{steiner-2019-augmenting,
    author    = {Steiner, Petra},
    title     = {Augmenting a {German} Morphological Database by Data-Intense Methods},
    editor    = {Nicolai, Garrett and Cotterell, Ryan},
    booktitle = {Proceedings of the 16th Workshop on Computational Research in Phonetics, Phonology, and Morphology},
    month     = aug,
    year      = {2019},
    address   = {Florence, Italy},
    publisher = {Association for Computational Linguistics},
    pages     = {178--188},
    doi       = {10.18653/v1/W19-4221},
    url       = {https://aclanthology.org/W19-4221},
    abstract  = {This paper deals with the automatic enhancement of a new German morphological database. While there are some databases for flat word segmentation, this is the first available resource which can be directly used for deep parsing of German words. We combine the entries of this morphological database with the morphological tools SMOR and Moremorph and a context-based evaluation method which builds on a large Wikipedia corpus. We describe the state of the art and the essential characteristics of the database and the context method. The approach is tested on an inflight magazine of Lufthansa. We derive over 5,000 new instances of complex words. The coverage for the lemma types reaches up to over 99 percent. The precision of new found complex splits and monomorphemes is between 0.93 and 0.99.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS record for the paper with citekey steiner-2019-augmenting. -->
  <mods ID="steiner-2019-augmenting">
    <titleInfo>
      <title>Augmenting a German Morphological Database by Data-Intense Methods</title>
    </titleInfo>
    <!-- Author of the paper. -->
    <name type="personal">
      <namePart type="given">Petra</namePart>
      <namePart type="family">Steiner</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2019-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume containing the paper, with its editors and publisher. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 16th Workshop on Computational Research in Phonetics, Phonology, and Morphology</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Garrett</namePart>
        <namePart type="family">Nicolai</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Ryan</namePart>
        <namePart type="family">Cotterell</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">Florence, Italy</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>This paper deals with the automatic enhancement of a new German morphological database. While there are some databases for flat word segmentation, this is the first available resource which can be directly used for deep parsing of German words. We combine the entries of this morphological database with the morphological tools SMOR and Moremorph and a context-based evaluation method which builds on a large Wikipedia corpus. We describe the state of the art and the essential characteristics of the database and the context method. The approach is tested on an inflight magazine of Lufthansa. We derive over 5,000 new instances of complex words. The coverage for the lemma types reaches up to over 99 percent. The precision of new found complex splits and monomorphemes is between 0.93 and 0.99.</abstract>
    <!-- Identifiers and the landing-page URL for the paper. -->
    <identifier type="citekey">steiner-2019-augmenting</identifier>
    <identifier type="doi">10.18653/v1/W19-4221</identifier>
    <location>
      <url>https://aclanthology.org/W19-4221</url>
    </location>
    <!-- Date and page extent of the paper. -->
    <part>
      <date>2019-08</date>
      <extent unit="page">
        <start>178</start>
        <end>188</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Augmenting a German Morphological Database by Data-Intense Methods
%A Steiner, Petra
%Y Nicolai, Garrett
%Y Cotterell, Ryan
%S Proceedings of the 16th Workshop on Computational Research in Phonetics, Phonology, and Morphology
%D 2019
%8 August
%I Association for Computational Linguistics
%C Florence, Italy
%F steiner-2019-augmenting
%X This paper deals with the automatic enhancement of a new German morphological database. While there are some databases for flat word segmentation, this is the first available resource which can be directly used for deep parsing of German words. We combine the entries of this morphological database with the morphological tools SMOR and Moremorph and a context-based evaluation method which builds on a large Wikipedia corpus. We describe the state of the art and the essential characteristics of the database and the context method. The approach is tested on an inflight magazine of Lufthansa. We derive over 5,000 new instances of complex words. The coverage for the lemma types reaches up to over 99 percent. The precision of new found complex splits and monomorphemes is between 0.93 and 0.99.
%R 10.18653/v1/W19-4221
%U https://aclanthology.org/W19-4221
%U https://doi.org/10.18653/v1/W19-4221
%P 178-188
Markdown (Informal)
[Augmenting a German Morphological Database by Data-Intense Methods](https://aclanthology.org/W19-4221) (Steiner, ACL 2019)
ACL