@inproceedings{karpinska-etal-2018-subcharacter,
title = "Subcharacter Information in {J}apanese Embeddings: When Is It Worth It?",
author = "Karpinska, Marzena and
Li, Bofang and
Rogers, Anna and
Drozd, Aleksandr",
editor = "Dinu, Georgiana and
Ballesteros, Miguel and
Sil, Avirup and
Bowman, Sam and
Hamza, Wael and
S{\o}gaard, Anders and
Naseem, Tahira and
Goldberg, Yoav",
booktitle = "Proceedings of the Workshop on the Relevance of Linguistic Structure in Neural Architectures for {NLP}",
month = jul,
year = "2018",
address = "Melbourne, Australia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W18-2905",
doi = "10.18653/v1/W18-2905",
pages = "28--37",
abstract = "Languages with logographic writing systems present a difficulty for traditional character-level models. Leveraging the subcharacter information was recently shown to be beneficial for a number of intrinsic and extrinsic tasks in Chinese. We examine whether the same strategies could be applied for Japanese, and contribute a new analogy dataset for this language.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="karpinska-etal-2018-subcharacter">
<titleInfo>
<title>Subcharacter Information in Japanese Embeddings: When Is It Worth It?</title>
</titleInfo>
<name type="personal">
<namePart type="given">Marzena</namePart>
<namePart type="family">Karpinska</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Bofang</namePart>
<namePart type="family">Li</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Anna</namePart>
<namePart type="family">Rogers</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Aleksandr</namePart>
<namePart type="family">Drozd</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2018-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Workshop on the Relevance of Linguistic Structure in Neural Architectures for NLP</title>
</titleInfo>
<name type="personal">
<namePart type="given">Georgiana</namePart>
<namePart type="family">Dinu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Miguel</namePart>
<namePart type="family">Ballesteros</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Avirup</namePart>
<namePart type="family">Sil</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sam</namePart>
<namePart type="family">Bowman</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Wael</namePart>
<namePart type="family">Hamza</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Anders</namePart>
<namePart type="family">Søgaard</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tahira</namePart>
<namePart type="family">Naseem</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yoav</namePart>
<namePart type="family">Goldberg</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Melbourne, Australia</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Languages with logographic writing systems present a difficulty for traditional character-level models. Leveraging the subcharacter information was recently shown to be beneficial for a number of intrinsic and extrinsic tasks in Chinese. We examine whether the same strategies could be applied for Japanese, and contribute a new analogy dataset for this language.</abstract>
<identifier type="citekey">karpinska-etal-2018-subcharacter</identifier>
<identifier type="doi">10.18653/v1/W18-2905</identifier>
<location>
<url>https://aclanthology.org/W18-2905</url>
</location>
<part>
<date>2018-07</date>
<extent unit="page">
<start>28</start>
<end>37</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Subcharacter Information in Japanese Embeddings: When Is It Worth It?
%A Karpinska, Marzena
%A Li, Bofang
%A Rogers, Anna
%A Drozd, Aleksandr
%Y Dinu, Georgiana
%Y Ballesteros, Miguel
%Y Sil, Avirup
%Y Bowman, Sam
%Y Hamza, Wael
%Y Søgaard, Anders
%Y Naseem, Tahira
%Y Goldberg, Yoav
%S Proceedings of the Workshop on the Relevance of Linguistic Structure in Neural Architectures for NLP
%D 2018
%8 July
%I Association for Computational Linguistics
%C Melbourne, Australia
%F karpinska-etal-2018-subcharacter
%X Languages with logographic writing systems present a difficulty for traditional character-level models. Leveraging the subcharacter information was recently shown to be beneficial for a number of intrinsic and extrinsic tasks in Chinese. We examine whether the same strategies could be applied for Japanese, and contribute a new analogy dataset for this language.
%R 10.18653/v1/W18-2905
%U https://aclanthology.org/W18-2905
%U https://doi.org/10.18653/v1/W18-2905
%P 28-37
Markdown (Informal)
[Subcharacter Information in Japanese Embeddings: When Is It Worth It?](https://aclanthology.org/W18-2905) (Karpinska et al., ACL 2018)
ACL