@inproceedings{yoshino-etal-2020-improving,
title = "Improving Spoken Language Understanding by Wisdom of Crowds",
author = "Yoshino, Koichiro and
Ikeuchi, Kana and
Sudoh, Katsuhito and
Nakamura, Satoshi",
editor = "Scott, Donia and
Bel, Nuria and
Zong, Chengqing",
booktitle = "Proceedings of the 28th International Conference on Computational Linguistics",
month = dec,
year = "2020",
address = "Barcelona, Spain (Online)",
publisher = "International Committee on Computational Linguistics",
url = "https://aclanthology.org/2020.coling-main.234",
doi = "10.18653/v1/2020.coling-main.234",
pages = "2606--2612",
abstract = "Spoken language understanding (SLU), which converts user requests in natural language to machine-interpretable expressions, is becoming an essential task. The lack of training data is an important problem, especially for new system tasks, because existing SLU systems are based on statistical approaches. In this paper, we proposed to use two sources of the {``}wisdom of crowds,{''} crowdsourcing and knowledge community website, for improving the SLU system. We firstly collected paraphrasing variations for new system tasks through crowdsourcing as seed data, and then augmented them using similar questions from a knowledge community website. We investigated the effects of the proposed data augmentation method in SLU task, even with small seed data. In particular, the proposed architecture augmented more than 120,000 samples to improve SLU accuracies.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="yoshino-etal-2020-improving">
<titleInfo>
<title>Improving Spoken Language Understanding by Wisdom of Crowds</title>
</titleInfo>
<name type="personal">
<namePart type="given">Koichiro</namePart>
<namePart type="family">Yoshino</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kana</namePart>
<namePart type="family">Ikeuchi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Katsuhito</namePart>
<namePart type="family">Sudoh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Satoshi</namePart>
<namePart type="family">Nakamura</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 28th International Conference on Computational Linguistics</title>
</titleInfo>
<name type="personal">
<namePart type="given">Donia</namePart>
<namePart type="family">Scott</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nuria</namePart>
<namePart type="family">Bel</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chengqing</namePart>
<namePart type="family">Zong</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>International Committee on Computational Linguistics</publisher>
<place>
<placeTerm type="text">Barcelona, Spain (Online)</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Spoken language understanding (SLU), which converts user requests in natural language to machine-interpretable expressions, is becoming an essential task. The lack of training data is an important problem, especially for new system tasks, because existing SLU systems are based on statistical approaches. In this paper, we proposed to use two sources of the “wisdom of crowds,” crowdsourcing and knowledge community website, for improving the SLU system. We firstly collected paraphrasing variations for new system tasks through crowdsourcing as seed data, and then augmented them using similar questions from a knowledge community website. We investigated the effects of the proposed data augmentation method in SLU task, even with small seed data. In particular, the proposed architecture augmented more than 120,000 samples to improve SLU accuracies.</abstract>
<identifier type="citekey">yoshino-etal-2020-improving</identifier>
<identifier type="doi">10.18653/v1/2020.coling-main.234</identifier>
<location>
<url>https://aclanthology.org/2020.coling-main.234</url>
</location>
<part>
<date>2020-12</date>
<extent unit="page">
<start>2606</start>
<end>2612</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Improving Spoken Language Understanding by Wisdom of Crowds
%A Yoshino, Koichiro
%A Ikeuchi, Kana
%A Sudoh, Katsuhito
%A Nakamura, Satoshi
%Y Scott, Donia
%Y Bel, Nuria
%Y Zong, Chengqing
%S Proceedings of the 28th International Conference on Computational Linguistics
%D 2020
%8 December
%I International Committee on Computational Linguistics
%C Barcelona, Spain (Online)
%F yoshino-etal-2020-improving
%X Spoken language understanding (SLU), which converts user requests in natural language to machine-interpretable expressions, is becoming an essential task. The lack of training data is an important problem, especially for new system tasks, because existing SLU systems are based on statistical approaches. In this paper, we proposed to use two sources of the “wisdom of crowds,” crowdsourcing and knowledge community website, for improving the SLU system. We firstly collected paraphrasing variations for new system tasks through crowdsourcing as seed data, and then augmented them using similar questions from a knowledge community website. We investigated the effects of the proposed data augmentation method in SLU task, even with small seed data. In particular, the proposed architecture augmented more than 120,000 samples to improve SLU accuracies.
%R 10.18653/v1/2020.coling-main.234
%U https://aclanthology.org/2020.coling-main.234
%U https://doi.org/10.18653/v1/2020.coling-main.234
%P 2606-2612
Markdown (Informal)
[Improving Spoken Language Understanding by Wisdom of Crowds](https://aclanthology.org/2020.coling-main.234) (Yoshino et al., COLING 2020)
ACL
- Koichiro Yoshino, Kana Ikeuchi, Katsuhito Sudoh, and Satoshi Nakamura. 2020. Improving Spoken Language Understanding by Wisdom of Crowds. In Proceedings of the 28th International Conference on Computational Linguistics, pages 2606–2612, Barcelona, Spain (Online). International Committee on Computational Linguistics.