@inproceedings{zeldes-2018-characterwise,
title = "A Characterwise Windowed Approach to {H}ebrew Morphological Segmentation",
author = "Zeldes, Amir",
editor = "Kuebler, Sandra and
Nicolai, Garrett",
booktitle = "Proceedings of the Fifteenth Workshop on Computational Research in Phonetics, Phonology, and Morphology",
month = oct,
year = "2018",
address = "Brussels, Belgium",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W18-5811",
doi = "10.18653/v1/W18-5811",
pages = "101--110",
abstract = "This paper presents a novel approach to the segmentation of orthographic word forms in contemporary Hebrew, focusing purely on splitting without carrying out morphological analysis or disambiguation. Casting the analysis task as character-wise binary classification and using adjacent character and word-based lexicon-lookup features, this approach achieves over 98{\%} accuracy on the benchmark SPMRL shared task data for Hebrew, and 97{\%} accuracy on a new out of domain Wikipedia dataset, an improvement of {\mbox{$\approx$}}4{\%} and 5{\%} over previous state of the art performance.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="zeldes-2018-characterwise">
<titleInfo>
<title>A Characterwise Windowed Approach to Hebrew Morphological Segmentation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Amir</namePart>
<namePart type="family">Zeldes</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2018-10</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Fifteenth Workshop on Computational Research in Phonetics, Phonology, and Morphology</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sandra</namePart>
<namePart type="family">Kuebler</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Garrett</namePart>
<namePart type="family">Nicolai</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Brussels, Belgium</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper presents a novel approach to the segmentation of orthographic word forms in contemporary Hebrew, focusing purely on splitting without carrying out morphological analysis or disambiguation. Casting the analysis task as character-wise binary classification and using adjacent character and word-based lexicon-lookup features, this approach achieves over 98% accuracy on the benchmark SPMRL shared task data for Hebrew, and 97% accuracy on a new out of domain Wikipedia dataset, an improvement of ≈4% and 5% over previous state of the art performance.</abstract>
<identifier type="citekey">zeldes-2018-characterwise</identifier>
<identifier type="doi">10.18653/v1/W18-5811</identifier>
<location>
<url>https://aclanthology.org/W18-5811</url>
</location>
<part>
<date>2018-10</date>
<extent unit="page">
<start>101</start>
<end>110</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T A Characterwise Windowed Approach to Hebrew Morphological Segmentation
%A Zeldes, Amir
%Y Kuebler, Sandra
%Y Nicolai, Garrett
%S Proceedings of the Fifteenth Workshop on Computational Research in Phonetics, Phonology, and Morphology
%D 2018
%8 October
%I Association for Computational Linguistics
%C Brussels, Belgium
%F zeldes-2018-characterwise
%X This paper presents a novel approach to the segmentation of orthographic word forms in contemporary Hebrew, focusing purely on splitting without carrying out morphological analysis or disambiguation. Casting the analysis task as character-wise binary classification and using adjacent character and word-based lexicon-lookup features, this approach achieves over 98% accuracy on the benchmark SPMRL shared task data for Hebrew, and 97% accuracy on a new out of domain Wikipedia dataset, an improvement of ≈4% and 5% over previous state of the art performance.
%R 10.18653/v1/W18-5811
%U https://aclanthology.org/W18-5811
%U https://doi.org/10.18653/v1/W18-5811
%P 101-110
Markdown (Informal)
[A Characterwise Windowed Approach to Hebrew Morphological Segmentation](https://aclanthology.org/W18-5811) (Zeldes, EMNLP 2018)
ACL