@inproceedings{yuan-etal-2023-ambicoref,
title = "{A}mbi{C}oref: Evaluating Human and Model Sensitivity to Ambiguous Coreference",
author = "Yuan, Yuewei and
Malaviya, Chaitanya and
Yatskar, Mark",
editor = "Vlachos, Andreas and
Augenstein, Isabelle",
booktitle = "Findings of the Association for Computational Linguistics: EACL 2023",
month = may,
year = "2023",
address = "Dubrovnik, Croatia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.findings-eacl.75",
doi = "10.18653/v1/2023.findings-eacl.75",
pages = "1023--1030",
abstract = "Given a sentence {``}Abby told Brittney that she upset Courtney{''}, one would struggle to understand who {``}she{''} refers to, and ask for clarification. However, if the word {``}upset{''} were replaced with {``}hugged{''}, {``}she{''} unambiguously refers to Abby. We study if modern coreference resolution models are sensitive to such pronominal ambiguity. To this end, we construct AmbiCoref, a diagnostic corpus of minimal sentence pairs with ambiguous and unambiguous referents. Our examples generalize psycholinguistic studies of human perception of ambiguity around particular arrangements of verbs and their arguments. Analysis shows that (1) humans are less sure of referents in ambiguous AmbiCoref examples than unambiguous ones, and (2) most coreference models show little difference in output between ambiguous and unambiguous pairs. We release AmbiCoref as a diagnostic corpus for testing whether models treat ambiguity similarly to humans.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="yuan-etal-2023-ambicoref">
<titleInfo>
<title>AmbiCoref: Evaluating Human and Model Sensitivity to Ambiguous Coreference</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yuewei</namePart>
<namePart type="family">Yuan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chaitanya</namePart>
<namePart type="family">Malaviya</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mark</namePart>
<namePart type="family">Yatskar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2023-05</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Findings of the Association for Computational Linguistics: EACL 2023</title>
</titleInfo>
<name type="personal">
<namePart type="given">Andreas</namePart>
<namePart type="family">Vlachos</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Isabelle</namePart>
<namePart type="family">Augenstein</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Dubrovnik, Croatia</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Given a sentence “Abby told Brittney that she upset Courtney”, one would struggle to understand who “she” refers to, and ask for clarification. However, if the word “upset” were replaced with “hugged”, “she” unambiguously refers to Abby. We study if modern coreference resolution models are sensitive to such pronominal ambiguity. To this end, we construct AmbiCoref, a diagnostic corpus of minimal sentence pairs with ambiguous and unambiguous referents. Our examples generalize psycholinguistic studies of human perception of ambiguity around particular arrangements of verbs and their arguments. Analysis shows that (1) humans are less sure of referents in ambiguous AmbiCoref examples than unambiguous ones, and (2) most coreference models show little difference in output between ambiguous and unambiguous pairs. We release AmbiCoref as a diagnostic corpus for testing whether models treat ambiguity similarly to humans.</abstract>
<identifier type="citekey">yuan-etal-2023-ambicoref</identifier>
<identifier type="doi">10.18653/v1/2023.findings-eacl.75</identifier>
<location>
<url>https://aclanthology.org/2023.findings-eacl.75</url>
</location>
<part>
<date>2023-05</date>
<extent unit="page">
<start>1023</start>
<end>1030</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T AmbiCoref: Evaluating Human and Model Sensitivity to Ambiguous Coreference
%A Yuan, Yuewei
%A Malaviya, Chaitanya
%A Yatskar, Mark
%Y Vlachos, Andreas
%Y Augenstein, Isabelle
%S Findings of the Association for Computational Linguistics: EACL 2023
%D 2023
%8 May
%I Association for Computational Linguistics
%C Dubrovnik, Croatia
%F yuan-etal-2023-ambicoref
%X Given a sentence “Abby told Brittney that she upset Courtney”, one would struggle to understand who “she” refers to, and ask for clarification. However, if the word “upset” were replaced with “hugged”, “she” unambiguously refers to Abby. We study if modern coreference resolution models are sensitive to such pronominal ambiguity. To this end, we construct AmbiCoref, a diagnostic corpus of minimal sentence pairs with ambiguous and unambiguous referents. Our examples generalize psycholinguistic studies of human perception of ambiguity around particular arrangements of verbs and their arguments. Analysis shows that (1) humans are less sure of referents in ambiguous AmbiCoref examples than unambiguous ones, and (2) most coreference models show little difference in output between ambiguous and unambiguous pairs. We release AmbiCoref as a diagnostic corpus for testing whether models treat ambiguity similarly to humans.
%R 10.18653/v1/2023.findings-eacl.75
%U https://aclanthology.org/2023.findings-eacl.75
%U https://doi.org/10.18653/v1/2023.findings-eacl.75
%P 1023-1030
Markdown (Informal)
[AmbiCoref: Evaluating Human and Model Sensitivity to Ambiguous Coreference](https://aclanthology.org/2023.findings-eacl.75) (Yuan et al., Findings 2023)
ACL