% LREC 2016 paper presenting NorGramBank. Author names use the "Last, First"
% form so that the capitalised particle in "De Smedt" stays part of the surname.
@inproceedings{L16-1565,
  author    = {Dyvik, Helge and Meurer, Paul and Rosén, Victoria and De Smedt, Koenraad and Haugereid, Petter and Losnegaard, Gyri Smørdal and Lyse, Gunn Inger and Thunes, Martha},
  title     = {{NorGramBank}: A ‘Deep’ Treebank for {Norwegian}},
  booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation ({LREC} 2016)},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Portorož, Slovenia},
  month     = may,
  year      = {2016},
  pages     = {3555--3562},
  url       = {https://www.aclweb.org/anthology/L16-1565},
  abstract  = {We present NorGramBank, a treebank for Norwegian with highly detailed LFG analyses. It is one of many treebanks made available through the INESS treebanking infrastructure. NorGramBank was constructed as a parsebank, i.e. by automatically parsing a corpus, using the wide coverage grammar NorGram. One part consisting of 350,000 words has been manually disambiguated using computer-generated discriminants. A larger part of 50 M words has been stochastically disambiguated. The treebank is dynamic: by global reparsing at certain intervals it is kept compatible with the latest versions of the grammar and the lexicon, which are continually further developed in interaction with the annotators. A powerful query language, INESS Search, has been developed for search across formalisms in the INESS treebanks, including LFG c- and f-structures. Evaluation shows that the grammar provides about 85\% of randomly selected sentences with good analyses. Agreement among the annotators responsible for manual disambiguation is satisfactory, but also suggests desirable simplifications of the grammar.},
}

