@inproceedings{wang-keuleers-2024-simplified,
title = "Simplified {C}hinese Character Distance Based on Ideographic Description Sequences",
author = "Wang, Yixia and
Keuleers, Emmanuel",
editor = "Gorman, Kyle and
Prud'hommeaux, Emily and
Roark, Brian and
Sproat, Richard",
booktitle = "Proceedings of the Second Workshop on Computation and Written Language (CAWL) @ LREC-COLING 2024",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://aclanthology.org/2024.cawl-1.8",
pages = "59--66",
abstract = "Character encoding systems have long overlooked the internal structure of characters. Ideographic Description Sequences, which explicitly represent spatial relations between character components, are a potential solution to this problem. In this paper, we illustrate the utility of Ideographic Description Sequences in computing edit distance and finding orthographic neighbors for Simplified Chinese characters. In addition, we explore the possibility of using Ideographic Description Sequences to encode spatial relations between components in other scripts.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="wang-keuleers-2024-simplified">
<titleInfo>
<title>Simplified Chinese Character Distance Based on Ideographic Description Sequences</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yixia</namePart>
<namePart type="family">Wang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Emmanuel</namePart>
<namePart type="family">Keuleers</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-05</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Second Workshop on Computation and Written Language (CAWL) @ LREC-COLING 2024</title>
</titleInfo>
<name type="personal">
<namePart type="given">Kyle</namePart>
<namePart type="family">Gorman</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Emily</namePart>
<namePart type="family">Prud’hommeaux</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Brian</namePart>
<namePart type="family">Roark</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Richard</namePart>
<namePart type="family">Sproat</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>ELRA and ICCL</publisher>
<place>
<placeTerm type="text">Torino, Italia</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Character encoding systems have long overlooked the internal structure of characters. Ideographic Description Sequences, which explicitly represent spatial relations between character components, are a potential solution to this problem. In this paper, we illustrate the utility of Ideographic Description Sequences in computing edit distance and finding orthographic neighbors for Simplified Chinese characters. In addition, we explore the possibility of using Ideographic Description Sequences to encode spatial relations between components in other scripts.</abstract>
<identifier type="citekey">wang-keuleers-2024-simplified</identifier>
<location>
<url>https://aclanthology.org/2024.cawl-1.8</url>
</location>
<part>
<date>2024-05</date>
<extent unit="page">
<start>59</start>
<end>66</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Simplified Chinese Character Distance Based on Ideographic Description Sequences
%A Wang, Yixia
%A Keuleers, Emmanuel
%Y Gorman, Kyle
%Y Prud’hommeaux, Emily
%Y Roark, Brian
%Y Sproat, Richard
%S Proceedings of the Second Workshop on Computation and Written Language (CAWL) @ LREC-COLING 2024
%D 2024
%8 May
%I ELRA and ICCL
%C Torino, Italia
%F wang-keuleers-2024-simplified
%X Character encoding systems have long overlooked the internal structure of characters. Ideographic Description Sequences, which explicitly represent spatial relations between character components, are a potential solution to this problem. In this paper, we illustrate the utility of Ideographic Description Sequences in computing edit distance and finding orthographic neighbors for Simplified Chinese characters. In addition, we explore the possibility of using Ideographic Description Sequences to encode spatial relations between components in other scripts.
%U https://aclanthology.org/2024.cawl-1.8
%P 59-66
Markdown (Informal)
[Simplified Chinese Character Distance Based on Ideographic Description Sequences](https://aclanthology.org/2024.cawl-1.8) (Wang & Keuleers, CAWL-WS 2024)
ACL