% Conference paper record for Itai and Segal (2003), as listed at the URL in the url field.
% The month field concatenates the predefined macro sep with a day range
% (presumably the dates of the event; confirm against the workshop programme).
% The range uses a double hyphen so that LaTeX typesets it as an en dash.
@inproceedings{itai-segal-2003-corpus,
    title = "A corpus based morphological analyzer for unvocalized modern {Hebrew}",
    author = "Itai, Alon and
      Segal, Erel",
    booktitle = "Workshop on Machine Translation for Semitic languages: issues and approaches",
    month = sep # " 23--27",
    year = "2003",
    address = "New Orleans, USA",
    url = "https://aclanthology.org/2003.mtsummit-semit.9",
    abstract = "Most words in Modern Hebrew texts are morphologically ambiguous. We describe a method for finding the correct morphological analysis of each word in a Modern Hebrew text. The program first uses a small tagged corpus to estimate the probability of each possible analysis of each word regardless of its context and chooses the most probable analysis. It then applies automatically learned rules to correct the analysis of each word according to its neighbors. Finally, it uses a simple syntactical analyzer to further correct the analysis, thus combining statistical methods with rule-based syntactic analysis. It is shown that this combination greatly improves the accuracy of the morphological analysis{---}achieving up to 96.2{\%} accuracy.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS record for the paper with citekey itai-segal-2003-corpus. -->
  <mods ID="itai-segal-2003-corpus">
    <titleInfo>
      <title>A corpus based morphological analyzer for unvocalized modern Hebrew</title>
    </titleInfo>
    <!-- Authors, in citation order. -->
    <name type="personal">
      <namePart type="given">Alon</namePart>
      <namePart type="family">Itai</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Erel</namePart>
      <namePart type="family">Segal</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <!-- Date range 23 to 27 September 2003, given as a machine-readable start/end pair. -->
      <dateIssued encoding="w3cdtf" point="start">2003-09-23</dateIssued>
      <dateIssued encoding="w3cdtf" point="end">2003-09-27</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the workshop in which the paper appeared. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Workshop on Machine Translation for Semitic languages: issues and approaches</title>
      </titleInfo>
      <originInfo>
        <place>
          <placeTerm type="text">New Orleans, USA</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>Most words in Modern Hebrew texts are morphologically ambiguous. We describe a method for finding the correct morphological analysis of each word in a Modern Hebrew text. The program first uses a small tagged corpus to estimate the probability of each possible analysis of each word regardless of its context and chooses the most probable analysis. It then applies automatically learned rules to correct the analysis of each word according to its neighbors. Finally, it uses a simple syntactical analyzer to further correct the analysis, thus combining statistical methods with rule-based syntactic analysis. It is shown that this combination greatly improves the accuracy of the morphological analysis—achieving up to 96.2% accuracy.</abstract>
    <identifier type="citekey">itai-segal-2003-corpus</identifier>
    <location>
      <url>https://aclanthology.org/2003.mtsummit-semit.9</url>
    </location>
    <part>
      <!-- Same date range as originInfo above, in the same encoding. -->
      <date encoding="w3cdtf" point="start">2003-09-23</date>
      <date encoding="w3cdtf" point="end">2003-09-27</date>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T A corpus based morphological analyzer for unvocalized modern Hebrew
%A Itai, Alon
%A Segal, Erel
%S Workshop on Machine Translation for Semitic languages: issues and approaches
%D 2003
%8 sep 23-27
%C New Orleans, USA
%F itai-segal-2003-corpus
%X Most words in Modern Hebrew texts are morphologically ambiguous. We describe a method for finding the correct morphological analysis of each word in a Modern Hebrew text. The program first uses a small tagged corpus to estimate the probability of each possible analysis of each word regardless of its context and chooses the most probable analysis. It then applies automatically learned rules to correct the analysis of each word according to its neighbors. Finally, it uses a simple syntactical analyzer to further correct the analysis, thus combining statistical methods with rule-based syntactic analysis. It is shown that this combination greatly improves the accuracy of the morphological analysis—achieving up to 96.2% accuracy.
%U https://aclanthology.org/2003.mtsummit-semit.9
Markdown (Informal)
[A corpus based morphological analyzer for unvocalized modern Hebrew](https://aclanthology.org/2003.mtsummit-semit.9) (Itai & Segal, MTSummit 2003)
ACL