% Conference paper record: Tham (2020), ICON 2020 System Demonstrations.
@inproceedings{tham-2020-nlp,
  title     = {{NLP} Tools for {Khasi}, a low resource language},
  author    = {Tham, Medari},
  editor    = {Goyal, Vishal and Ekbal, Asif},
  booktitle = {Proceedings of the 17th International Conference on Natural Language Processing ({ICON}): System Demonstrations},
  month     = dec,
  year      = {2020},
  address   = {Patna, India},
  publisher = {NLP Association of India (NLPAI)},
  url       = {https://aclanthology.org/2020.icon-demos.10},
  pages     = {26--27},
  abstract  = {Khasi is an Austro Asiatic language spoken by one of the tribes in Meghalaya, and parts of Assam and Bangladesh. The fact that some NLP tools for Khasi are now available online for testing purposes is the culmination of the arduous investment in time and effort. Initially when work for Khasi was initiated, resources for Khasi, such as tagset and annotated corpus or any NLP tools, were nonexistent. As part of the author{'}s ongoing work for her doctoral program, currently, the resources for Khasi that are in place are the BIS (Bureau of Indian Standards) tagset for Khasi, a 90k annotated corpus, and NLP tools such as POS (parts of speech) taggers and shallow parsers. These mentioned tools are highlighted in this demonstration paper.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS record for the conference paper with citekey tham-2020-nlp. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="tham-2020-nlp">
    <!-- The paper itself: title, author, issue date. -->
    <titleInfo>
      <title>NLP Tools for Khasi, a low resource language</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Medari</namePart>
      <namePart type="family">Tham</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2020-12</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host publication: the proceedings volume, its editors and publisher. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 17th International Conference on Natural Language Processing (ICON): System Demonstrations</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Vishal</namePart>
        <namePart type="family">Goyal</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Asif</namePart>
        <namePart type="family">Ekbal</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>NLP Association of India (NLPAI)</publisher>
        <place>
          <placeTerm type="text">Patna, India</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>Khasi is an Austro Asiatic language spoken by one of the tribes in Meghalaya, and parts of Assam and Bangladesh. The fact that some NLP tools for Khasi are now available online for testing purposes is the culmination of the arduous investment in time and effort. Initially when work for Khasi was initiated, resources for Khasi, such as tagset and annotated corpus or any NLP tools, were nonexistent. As part of the author’s ongoing work for her doctoral program, currently, the resources for Khasi that are in place are the BIS (Bureau of Indian Standards) tagset for Khasi, a 90k annotated corpus, and NLP tools such as POS (parts of speech) taggers and shallow parsers. These mentioned tools are highlighted in this demonstration paper.</abstract>
    <identifier type="citekey">tham-2020-nlp</identifier>
    <location>
      <url>https://aclanthology.org/2020.icon-demos.10</url>
    </location>
    <!-- Position of the paper within the host volume. -->
    <part>
      <date>2020-12</date>
      <extent unit="page">
        <start>26</start>
        <end>27</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T NLP Tools for Khasi, a low resource language
%A Tham, Medari
%Y Goyal, Vishal
%Y Ekbal, Asif
%S Proceedings of the 17th International Conference on Natural Language Processing (ICON): System Demonstrations
%D 2020
%8 December
%I NLP Association of India (NLPAI)
%C Patna, India
%F tham-2020-nlp
%X Khasi is an Austro Asiatic language spoken by one of the tribes in Meghalaya, and parts of Assam and Bangladesh. The fact that some NLP tools for Khasi are now available online for testing purposes is the culmination of the arduous investment in time and effort. Initially when work for Khasi was initiated, resources for Khasi, such as tagset and annotated corpus or any NLP tools, were nonexistent. As part of the author’s ongoing work for her doctoral program, currently, the resources for Khasi that are in place are the BIS (Bureau of Indian Standards) tagset for Khasi, a 90k annotated corpus, and NLP tools such as POS (parts of speech) taggers and shallow parsers. These mentioned tools are highlighted in this demonstration paper.
%U https://aclanthology.org/2020.icon-demos.10
%P 26-27
Markdown (Informal)
[NLP Tools for Khasi, a low resource language](https://aclanthology.org/2020.icon-demos.10) (Tham, ICON 2020)
ACL
- Medari Tham. 2020. NLP Tools for Khasi, a low resource language. In Proceedings of the 17th International Conference on Natural Language Processing (ICON): System Demonstrations, pages 26–27, Patna, India. NLP Association of India (NLPAI).