@inproceedings{nedelchev-etal-2021-proxy,
title = "Proxy Indicators for the Quality of Open-domain Dialogues",
author = "Nedelchev, Rostislav and
Lehmann, Jens and
Usbeck, Ricardo",
booktitle = "Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2021",
address = "Online and Punta Cana, Dominican Republic",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2021.emnlp-main.618",
doi = "10.18653/v1/2021.emnlp-main.618",
pages = "7834--7855",
abstract = "The automatic evaluation of open-domain dialogues remains a largely unsolved challenge. Despite the abundance of work done in the field, human judges have to evaluate dialogues{'} quality. As a consequence, performing such evaluations at scale is usually expensive. This work investigates using a deep-learning model trained on the General Language Understanding Evaluation (GLUE) benchmark to serve as a quality indication of open-domain dialogues. The aim is to use the various GLUE tasks as different perspectives on judging the quality of conversation, thus reducing the need for additional training data or responses that serve as quality references. Due to this nature, the method can infer various quality metrics and can derive a component-based overall score. We achieve statistically significant correlation coefficients of up to 0.7.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="nedelchev-etal-2021-proxy">
<titleInfo>
<title>Proxy Indicators for the Quality of Open-domain Dialogues</title>
</titleInfo>
<name type="personal">
<namePart type="given">Rostislav</namePart>
<namePart type="family">Nedelchev</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jens</namePart>
<namePart type="family">Lehmann</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ricardo</namePart>
<namePart type="family">Usbeck</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021-11</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online and Punta Cana, Dominican Republic</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>The automatic evaluation of open-domain dialogues remains a largely unsolved challenge. Despite the abundance of work done in the field, human judges have to evaluate dialogues’ quality. As a consequence, performing such evaluations at scale is usually expensive. This work investigates using a deep-learning model trained on the General Language Understanding Evaluation (GLUE) benchmark to serve as a quality indication of open-domain dialogues. The aim is to use the various GLUE tasks as different perspectives on judging the quality of conversation, thus reducing the need for additional training data or responses that serve as quality references. Due to this nature, the method can infer various quality metrics and can derive a component-based overall score. We achieve statistically significant correlation coefficients of up to 0.7.</abstract>
<identifier type="citekey">nedelchev-etal-2021-proxy</identifier>
<identifier type="doi">10.18653/v1/2021.emnlp-main.618</identifier>
<location>
<url>https://aclanthology.org/2021.emnlp-main.618</url>
</location>
<part>
<date>2021-11</date>
<extent unit="page">
<start>7834</start>
<end>7855</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Proxy Indicators for the Quality of Open-domain Dialogues
%A Nedelchev, Rostislav
%A Lehmann, Jens
%A Usbeck, Ricardo
%S Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing
%D 2021
%8 November
%I Association for Computational Linguistics
%C Online and Punta Cana, Dominican Republic
%F nedelchev-etal-2021-proxy
%X The automatic evaluation of open-domain dialogues remains a largely unsolved challenge. Despite the abundance of work done in the field, human judges have to evaluate dialogues’ quality. As a consequence, performing such evaluations at scale is usually expensive. This work investigates using a deep-learning model trained on the General Language Understanding Evaluation (GLUE) benchmark to serve as a quality indication of open-domain dialogues. The aim is to use the various GLUE tasks as different perspectives on judging the quality of conversation, thus reducing the need for additional training data or responses that serve as quality references. Due to this nature, the method can infer various quality metrics and can derive a component-based overall score. We achieve statistically significant correlation coefficients of up to 0.7.
%R 10.18653/v1/2021.emnlp-main.618
%U https://aclanthology.org/2021.emnlp-main.618
%U https://doi.org/10.18653/v1/2021.emnlp-main.618
%P 7834-7855
Markdown (Informal)
[Proxy Indicators for the Quality of Open-domain Dialogues](https://aclanthology.org/2021.emnlp-main.618) (Nedelchev et al., EMNLP 2021)
ACL
- Rostislav Nedelchev, Jens Lehmann, and Ricardo Usbeck. 2021. Proxy Indicators for the Quality of Open-domain Dialogues. In Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pages 7834–7855, Online and Punta Cana, Dominican Republic. Association for Computational Linguistics.