@inproceedings{wang-shih-2018-hybrid,
title = "A Hybrid Approach Combining Statistical Knowledge with Conditional Random Fields for {C}hinese Grammatical Error Detection",
author = "Wang, Yiyi and
Shih, Chilin",
editor = "Tseng, Yuen-Hsien and
Chen, Hsin-Hsi and
Ng, Vincent and
Komachi, Mamoru",
booktitle = "Proceedings of the 5th Workshop on Natural Language Processing Techniques for Educational Applications",
month = jul,
year = "2018",
address = "Melbourne, Australia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W18-3728",
doi = "10.18653/v1/W18-3728",
pages = "194--198",
abstract = "This paper presents a method of combining Conditional Random Fields (CRFs) model with a post-processing layer using Google n-grams statistical information tailored to detect word selection and word order errors made by learners of Chinese as Foreign Language (CFL). We describe the architecture of the model and its performance in the shared task of the ACL 2018 Workshop on Natural Language Processing Techniques for Educational Applications (NLPTEA). This hybrid approach yields comparably high false positive rate (FPR = 0.1274) and precision (Pd= 0.7519; Pi= 0.6311), but low recall (Rd = 0.3035; Ri = 0.1696 ) in grammatical error detection and identification tasks. Additional statistical information and linguistic rules can be added to enhance the model performance in the future.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="wang-shih-2018-hybrid">
<titleInfo>
<title>A Hybrid Approach Combining Statistical Knowledge with Conditional Random Fields for Chinese Grammatical Error Detection</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yiyi</namePart>
<namePart type="family">Wang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chilin</namePart>
<namePart type="family">Shih</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2018-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 5th Workshop on Natural Language Processing Techniques for Educational Applications</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yuen-Hsien</namePart>
<namePart type="family">Tseng</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hsin-Hsi</namePart>
<namePart type="family">Chen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Vincent</namePart>
<namePart type="family">Ng</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mamoru</namePart>
<namePart type="family">Komachi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Melbourne, Australia</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper presents a method of combining Conditional Random Fields (CRFs) model with a post-processing layer using Google n-grams statistical information tailored to detect word selection and word order errors made by learners of Chinese as Foreign Language (CFL). We describe the architecture of the model and its performance in the shared task of the ACL 2018 Workshop on Natural Language Processing Techniques for Educational Applications (NLPTEA). This hybrid approach yields comparably high false positive rate (FPR = 0.1274) and precision (Pd= 0.7519; Pi= 0.6311), but low recall (Rd = 0.3035; Ri = 0.1696 ) in grammatical error detection and identification tasks. Additional statistical information and linguistic rules can be added to enhance the model performance in the future.</abstract>
<identifier type="citekey">wang-shih-2018-hybrid</identifier>
<identifier type="doi">10.18653/v1/W18-3728</identifier>
<location>
<url>https://aclanthology.org/W18-3728</url>
</location>
<part>
<date>2018-07</date>
<extent unit="page">
<start>194</start>
<end>198</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T A Hybrid Approach Combining Statistical Knowledge with Conditional Random Fields for Chinese Grammatical Error Detection
%A Wang, Yiyi
%A Shih, Chilin
%Y Tseng, Yuen-Hsien
%Y Chen, Hsin-Hsi
%Y Ng, Vincent
%Y Komachi, Mamoru
%S Proceedings of the 5th Workshop on Natural Language Processing Techniques for Educational Applications
%D 2018
%8 July
%I Association for Computational Linguistics
%C Melbourne, Australia
%F wang-shih-2018-hybrid
%X This paper presents a method of combining Conditional Random Fields (CRFs) model with a post-processing layer using Google n-grams statistical information tailored to detect word selection and word order errors made by learners of Chinese as Foreign Language (CFL). We describe the architecture of the model and its performance in the shared task of the ACL 2018 Workshop on Natural Language Processing Techniques for Educational Applications (NLPTEA). This hybrid approach yields comparably high false positive rate (FPR = 0.1274) and precision (Pd= 0.7519; Pi= 0.6311), but low recall (Rd = 0.3035; Ri = 0.1696 ) in grammatical error detection and identification tasks. Additional statistical information and linguistic rules can be added to enhance the model performance in the future.
%R 10.18653/v1/W18-3728
%U https://aclanthology.org/W18-3728
%U https://doi.org/10.18653/v1/W18-3728
%P 194-198
Markdown (Informal)
[A Hybrid Approach Combining Statistical Knowledge with Conditional Random Fields for Chinese Grammatical Error Detection](https://aclanthology.org/W18-3728) (Wang & Shih, NLP-TEA 2018)
ACL