% Conference paper from the RANLP 2019 proceedings. Non-ASCII letters in names are written as LaTeX escapes.
@inproceedings{thorsteinsson-etal-2019-wide,
    title     = {A Wide-Coverage Context-Free Grammar for {Icelandic} and an Accompanying Parsing System},
    author    = {{\TH}orsteinsson, Vilhj{\'a}lmur and
                 {\'O}lad{\'o}ttir, Hulda and
                 Loftsson, Hrafn},
    editor    = {Mitkov, Ruslan and
                 Angelova, Galia},
    booktitle = {Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP 2019)},
    month     = sep,
    year      = {2019},
    address   = {Varna, Bulgaria},
    publisher = {INCOMA Ltd.},
    url       = {https://aclanthology.org/R19-1160},
    doi       = {10.26615/978-954-452-056-4_160},
    pages     = {1397--1404},
    abstract  = {We present an open-source, wide-coverage context-free grammar (CFG) for Icelandic, and an accompanying parsing system. The grammar has over 5,600 nonterminals, 4,600 terminals and 19,000 productions in fully expanded form, with feature agreement constraints for case, gender, number and person. The parsing system consists of an enhanced Earley-based parser and a mechanism to select best-scoring parse trees from shared packed parse forests. Our parsing system is able to parse about 90{\%} of all sentences in articles published on the main Icelandic news websites. Preliminary evaluation with evalb shows an F-measure of 70.72{\%} on parsed sentences. Our system demonstrates that parsing a morphologically rich language using a wide-coverage CFG can be practical.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 record for one conference paper. Personal names are stored as literal UTF-8 text, not LaTeX escapes. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="thorsteinsson-etal-2019-wide">
    <titleInfo>
      <title>A Wide-Coverage Context-Free Grammar for Icelandic and an Accompanying Parsing System</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Vilhjálmur</namePart>
      <namePart type="family">Þorsteinsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Hulda</namePart>
      <namePart type="family">Óladóttir</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Hrafn</namePart>
      <namePart type="family">Loftsson</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2019-09</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume this paper appears in, with its editors and publisher. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP 2019)</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Ruslan</namePart>
        <namePart type="family">Mitkov</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Galia</namePart>
        <namePart type="family">Angelova</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>INCOMA Ltd.</publisher>
        <place>
          <placeTerm type="text">Varna, Bulgaria</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>We present an open-source, wide-coverage context-free grammar (CFG) for Icelandic, and an accompanying parsing system. The grammar has over 5,600 nonterminals, 4,600 terminals and 19,000 productions in fully expanded form, with feature agreement constraints for case, gender, number and person. The parsing system consists of an enhanced Earley-based parser and a mechanism to select best-scoring parse trees from shared packed parse forests. Our parsing system is able to parse about 90% of all sentences in articles published on the main Icelandic news websites. Preliminary evaluation with evalb shows an F-measure of 70.72% on parsed sentences. Our system demonstrates that parsing a morphologically rich language using a wide-coverage CFG can be practical.</abstract>
    <identifier type="citekey">thorsteinsson-etal-2019-wide</identifier>
    <identifier type="doi">10.26615/978-954-452-056-4_160</identifier>
    <location>
      <url>https://aclanthology.org/R19-1160</url>
    </location>
    <part>
      <date>2019-09</date>
      <extent unit="page">
        <start>1397</start>
        <end>1404</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T A Wide-Coverage Context-Free Grammar for Icelandic and an Accompanying Parsing System
%A Þorsteinsson, Vilhjálmur
%A Óladóttir, Hulda
%A Loftsson, Hrafn
%Y Mitkov, Ruslan
%Y Angelova, Galia
%S Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP 2019)
%D 2019
%8 September
%I INCOMA Ltd.
%C Varna, Bulgaria
%F thorsteinsson-etal-2019-wide
%X We present an open-source, wide-coverage context-free grammar (CFG) for Icelandic, and an accompanying parsing system. The grammar has over 5,600 nonterminals, 4,600 terminals and 19,000 productions in fully expanded form, with feature agreement constraints for case, gender, number and person. The parsing system consists of an enhanced Earley-based parser and a mechanism to select best-scoring parse trees from shared packed parse forests. Our parsing system is able to parse about 90% of all sentences in articles published on the main Icelandic news websites. Preliminary evaluation with evalb shows an F-measure of 70.72% on parsed sentences. Our system demonstrates that parsing a morphologically rich language using a wide-coverage CFG can be practical.
%R 10.26615/978-954-452-056-4_160
%U https://aclanthology.org/R19-1160
%U https://doi.org/10.26615/978-954-452-056-4_160
%P 1397-1404
Markdown (Informal)
[A Wide-Coverage Context-Free Grammar for Icelandic and an Accompanying Parsing System](https://aclanthology.org/R19-1160) (Þorsteinsson et al., RANLP 2019)
ACL