@inproceedings{pine-etal-2025-zero,
title = "Zero-Shot Query Generation for Approximate Search Algorithm Evaluation",
author = "Pine, Aidan and
Huggins-Daines, David and
Leeming, Carmen and
Littell, Patrick and
Montler, Timothy and
Souter, Heather and
Turin, Mark",
editor = "Lachler, Jordan and
Agyapong, Godfred and
Arppe, Antti and
Moeller, Sarah and
Chaudhary, Aditi and
Rijhwani, Shruti and
Rosenblum, Daisy",
booktitle = "Proceedings of the Eighth Workshop on the Use of Computational Methods in the Study of Endangered Languages",
month = mar,
year = "2025",
address = "Honolulu, Hawaii, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2025.computel-main.7/",
pages = "65--73",
abstract = "Approximate search is a valuable component of online dictionaries for learners, allowing them to find words even when they have not fully mastered the orthography or cannot reliably perceive phonemic differences in the language. However, evaluating the performance of different approximate search algorithms remains difficult in the absence of real user queries. We detail several methods for generating synthetic queries representing various user personas. We then compare the performance of several search algorithms on both real and synthetic queries in two Indigenous languages, SEN{\'C}O{\={T}}EN and Michif, that are phonologically and morphologically very different from English."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="pine-etal-2025-zero">
<titleInfo>
<title>Zero-Shot Query Generation for Approximate Search Algorithm Evaluation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Aidan</namePart>
<namePart type="family">Pine</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">David</namePart>
<namePart type="family">Huggins-Daines</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Carmen</namePart>
<namePart type="family">Leeming</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Patrick</namePart>
<namePart type="family">Littell</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Timothy</namePart>
<namePart type="family">Montler</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Heather</namePart>
<namePart type="family">Souter</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mark</namePart>
<namePart type="family">Turin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2025-03</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Eighth Workshop on the Use of Computational Methods in the Study of Endangered Languages</title>
</titleInfo>
<name type="personal">
<namePart type="given">Jordan</namePart>
<namePart type="family">Lachler</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Godfred</namePart>
<namePart type="family">Agyapong</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Antti</namePart>
<namePart type="family">Arppe</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sarah</namePart>
<namePart type="family">Moeller</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Aditi</namePart>
<namePart type="family">Chaudhary</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Shruti</namePart>
<namePart type="family">Rijhwani</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Daisy</namePart>
<namePart type="family">Rosenblum</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Honolulu, Hawaii, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Approximate search is a valuable component of online dictionaries for learners, allowing them to find words even when they have not fully mastered the orthography or cannot reliably perceive phonemic differences in the language. However, evaluating the performance of different approximate search algorithms remains difficult in the absence of real user queries. We detail several methods for generating synthetic queries representing various user personas. We then compare the performance of several search algorithms on both real and synthetic queries in two Indigenous languages, SENĆOŦEN and Michif, that are phonologically and morphologically very different from English.</abstract>
<identifier type="citekey">pine-etal-2025-zero</identifier>
<location>
<url>https://aclanthology.org/2025.computel-main.7/</url>
</location>
<part>
<date>2025-03</date>
<extent unit="page">
<start>65</start>
<end>73</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Zero-Shot Query Generation for Approximate Search Algorithm Evaluation
%A Pine, Aidan
%A Huggins-Daines, David
%A Leeming, Carmen
%A Littell, Patrick
%A Montler, Timothy
%A Souter, Heather
%A Turin, Mark
%Y Lachler, Jordan
%Y Agyapong, Godfred
%Y Arppe, Antti
%Y Moeller, Sarah
%Y Chaudhary, Aditi
%Y Rijhwani, Shruti
%Y Rosenblum, Daisy
%S Proceedings of the Eighth Workshop on the Use of Computational Methods in the Study of Endangered Languages
%D 2025
%8 March
%I Association for Computational Linguistics
%C Honolulu, Hawaii, USA
%F pine-etal-2025-zero
%X Approximate search is a valuable component of online dictionaries for learners, allowing them to find words even when they have not fully mastered the orthography or cannot reliably perceive phonemic differences in the language. However, evaluating the performance of different approximate search algorithms remains difficult in the absence of real user queries. We detail several methods for generating synthetic queries representing various user personas. We then compare the performance of several search algorithms on both real and synthetic queries in two Indigenous languages, SENĆOŦEN and Michif, that are phonologically and morphologically very different from English.
%U https://aclanthology.org/2025.computel-main.7/
%P 65-73
Markdown (Informal)
[Zero-Shot Query Generation for Approximate Search Algorithm Evaluation](https://aclanthology.org/2025.computel-main.7/) (Pine et al., ComputEL 2025)
ACL
- Aidan Pine, David Huggins-Daines, Carmen Leeming, Patrick Littell, Timothy Montler, Heather Souter, and Mark Turin. 2025. Zero-Shot Query Generation for Approximate Search Algorithm Evaluation. In Proceedings of the Eighth Workshop on the Use of Computational Methods in the Study of Endangered Languages, pages 65–73, Honolulu, Hawaii, USA. Association for Computational Linguistics.