@inproceedings{rajpoot-2026-tifin,
title = "Tifin {I}ndia at {S}em{E}val-2026 Task 5: Semantic Bridge: Augmented Encoding for Word Sense Plausibility",
author = "Rajpoot, Pawan",
editor = "Kochmar, Ekaterina and
Ghosh, Debanjan and
North, Kai and
Komachi, Mamoru",
booktitle = "Proceedings of the 20th {I}nternational {W}orkshop on {S}emantic {E}valuation (2026)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.semeval-1.388/",
pages = "3095--3102",
ISBN = "979-8-89176-414-9",
abstract = "We present a hybrid system for SemEval 2026Task 5: Rating Plausibility of Word Senses inAmbiguous Stories. Our approach reframesLLMs as feature generators rather than directpredictors. We combine two subsystems: onethat appends LLM-generated hints to the in-put context and trains an encoder-based regres-sion model, and another that feeds structuredhints from multiple LLM configurations into alightweight regression ensemble. We generatemultilingual enrichments to probe LLMs forcomplementary signals and take advantage ofthe fact that translation into certain languagesimplicitly disambiguates word senses, makingthe encoder more robust. The 50/50 ensem-ble achieves 859/930 (92.37{\%}) accuracy withSpearman {\ensuremath{\rho}}= 0.8384 on the test set, exceed-ing the estimated human ceiling of 89.2{\%}. Thesame LLM enrichments, processed through fun-damentally different paradigms (tabular regres-sion vs. full-text encoding), produce comple-mentary errors that cancel under ensembling.Notably, simple 50/50 averaging captures thisgain without any learned combiner, suggest-ing that"
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="rajpoot-2026-tifin">
<titleInfo>
<title>Tifin India at SemEval-2026 Task 5: Semantic Bridge: Augmented Encoding for Word Sense Plausibility</title>
</titleInfo>
<name type="personal">
<namePart type="given">Pawan</namePart>
<namePart type="family">Rajpoot</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 20th International Workshop on Semantic Evaluation (2026)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Ekaterina</namePart>
<namePart type="family">Kochmar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Debanjan</namePart>
<namePart type="family">Ghosh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kai</namePart>
<namePart type="family">North</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mamoru</namePart>
<namePart type="family">Komachi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-414-9</identifier>
</relatedItem>
<abstract>We present a hybrid system for SemEval 2026Task 5: Rating Plausibility of Word Senses inAmbiguous Stories. Our approach reframesLLMs as feature generators rather than directpredictors. We combine two subsystems: onethat appends LLM-generated hints to the in-put context and trains an encoder-based regres-sion model, and another that feeds structuredhints from multiple LLM configurations into alightweight regression ensemble. We generatemultilingual enrichments to probe LLMs forcomplementary signals and take advantage ofthe fact that translation into certain languagesimplicitly disambiguates word senses, makingthe encoder more robust. The 50/50 ensem-ble achieves 859/930 (92.37%) accuracy withSpearman \ensuremathρ= 0.8384 on the test set, exceed-ing the estimated human ceiling of 89.2%. Thesame LLM enrichments, processed through fun-damentally different paradigms (tabular regres-sion vs. full-text encoding), produce comple-mentary errors that cancel under ensembling.Notably, simple 50/50 averaging captures thisgain without any learned combiner, suggest-ing that</abstract>
<identifier type="citekey">rajpoot-2026-tifin</identifier>
<location>
<url>https://aclanthology.org/2026.semeval-1.388/</url>
</location>
<part>
<date>2026-07</date>
<extent unit="page">
<start>3095</start>
<end>3102</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Tifin India at SemEval-2026 Task 5: Semantic Bridge: Augmented Encoding for Word Sense Plausibility
%A Rajpoot, Pawan
%Y Kochmar, Ekaterina
%Y Ghosh, Debanjan
%Y North, Kai
%Y Komachi, Mamoru
%S Proceedings of the 20th International Workshop on Semantic Evaluation (2026)
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, USA
%@ 979-8-89176-414-9
%F rajpoot-2026-tifin
%X We present a hybrid system for SemEval 2026Task 5: Rating Plausibility of Word Senses inAmbiguous Stories. Our approach reframesLLMs as feature generators rather than directpredictors. We combine two subsystems: onethat appends LLM-generated hints to the in-put context and trains an encoder-based regres-sion model, and another that feeds structuredhints from multiple LLM configurations into alightweight regression ensemble. We generatemultilingual enrichments to probe LLMs forcomplementary signals and take advantage ofthe fact that translation into certain languagesimplicitly disambiguates word senses, makingthe encoder more robust. The 50/50 ensem-ble achieves 859/930 (92.37%) accuracy withSpearman \ensuremathρ= 0.8384 on the test set, exceed-ing the estimated human ceiling of 89.2%. Thesame LLM enrichments, processed through fun-damentally different paradigms (tabular regres-sion vs. full-text encoding), produce comple-mentary errors that cancel under ensembling.Notably, simple 50/50 averaging captures thisgain without any learned combiner, suggest-ing that
%U https://aclanthology.org/2026.semeval-1.388/
%P 3095-3102
Markdown (Informal)
[Tifin India at SemEval-2026 Task 5: Semantic Bridge: Augmented Encoding for Word Sense Plausibility](https://aclanthology.org/2026.semeval-1.388/) (Rajpoot, SemEval 2026)
ACL