@inproceedings{nguyen-nguyen-2026-dangnt,
title = "{DANGNT}@{SGU} at {S}em{E}val-2026 Task 1: A Two-Stage Mistral Generator with {D}istil{BERT} Reranking for {E}nglish Humor Generation",
author = "Nguyen, Tan Loc and
Nguyen, Dang Tuan",
editor = "Kochmar, Ekaterina and
Ghosh, Debanjan and
North, Kai and
Komachi, Mamoru",
booktitle = "Proceedings of the 20th {I}nternational {W}orkshop on {S}emantic {E}valuation (2026)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.semeval-1.375/",
pages = "2986--2990",
ISBN = "979-8-89176-414-9",
abstract = "We describe DANGNT@SGU{'}s system for the English track of SemEval-2026 Task 1 (MWAHAHA), Subtask A (text-based humor generation). Our pipeline combines a two-stage QLoRA-adapted generator based on mistralai/Mistral-7B-Instruct-v0.2 with a DistilBERT reranker trained to distinguish jokes from non-jokes. The generator is first adapted on a raw joke corpus for general humor style, then further tuned on synthetic task-format instruction{--}response pairs for Word Inclusion and News Headline prompts. At inference time, we generate five candidates per input, optionally enforce lexical constraints for Word Inclusion prompts, and rerank candidates with the classifier. In the official English Subtask A results, our team DANGNT@SGU obtained Elo 962 (95{\%} CI: 926{--}986), ranking 13th. The system is practical, reproducible, and based entirely on open models and public data."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="nguyen-nguyen-2026-dangnt">
<titleInfo>
<title>DANGNT@SGU at SemEval-2026 Task 1: A Two-Stage Mistral Generator with DistilBERT Reranking for English Humor Generation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Tan</namePart>
<namePart type="given">Loc</namePart>
<namePart type="family">Nguyen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Dang</namePart>
<namePart type="given">Tuan</namePart>
<namePart type="family">Nguyen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 20th International Workshop on Semantic Evaluation (2026)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Ekaterina</namePart>
<namePart type="family">Kochmar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Debanjan</namePart>
<namePart type="family">Ghosh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kai</namePart>
<namePart type="family">North</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mamoru</namePart>
<namePart type="family">Komachi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-414-9</identifier>
</relatedItem>
<abstract>We describe DANGNT@SGU’s system for the English track of SemEval-2026 Task 1 (MWAHAHA), Subtask A (text-based humor generation). Our pipeline combines a two-stage QLoRA-adapted generator based on mistralai/Mistral-7B-Instruct-v0.2 with a DistilBERT reranker trained to distinguish jokes from non-jokes. The generator is first adapted on a raw joke corpus for general humor style, then further tuned on synthetic task-format instruction–response pairs for Word Inclusion and News Headline prompts. At inference time, we generate five candidates per input, optionally enforce lexical constraints for Word Inclusion prompts, and rerank candidates with the classifier. In the official English Subtask A results, our team DANGNT@SGU obtained Elo 962 (95% CI: 926–986), ranking 13th. The system is practical, reproducible, and based entirely on open models and public data.</abstract>
<identifier type="citekey">nguyen-nguyen-2026-dangnt</identifier>
<location>
<url>https://aclanthology.org/2026.semeval-1.375/</url>
</location>
<part>
<date>2026-07</date>
<extent unit="page">
<start>2986</start>
<end>2990</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T DANGNT@SGU at SemEval-2026 Task 1: A Two-Stage Mistral Generator with DistilBERT Reranking for English Humor Generation
%A Nguyen, Tan Loc
%A Nguyen, Dang Tuan
%Y Kochmar, Ekaterina
%Y Ghosh, Debanjan
%Y North, Kai
%Y Komachi, Mamoru
%S Proceedings of the 20th International Workshop on Semantic Evaluation (2026)
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, USA
%@ 979-8-89176-414-9
%F nguyen-nguyen-2026-dangnt
%X We describe DANGNT@SGU’s system for the English track of SemEval-2026 Task 1 (MWAHAHA), Subtask A (text-based humor generation). Our pipeline combines a two-stage QLoRA-adapted generator based on mistralai/Mistral-7B-Instruct-v0.2 with a DistilBERT reranker trained to distinguish jokes from non-jokes. The generator is first adapted on a raw joke corpus for general humor style, then further tuned on synthetic task-format instruction–response pairs for Word Inclusion and News Headline prompts. At inference time, we generate five candidates per input, optionally enforce lexical constraints for Word Inclusion prompts, and rerank candidates with the classifier. In the official English Subtask A results, our team DANGNT@SGU obtained Elo 962 (95% CI: 926–986), ranking 13th. The system is practical, reproducible, and based entirely on open models and public data.
%U https://aclanthology.org/2026.semeval-1.375/
%P 2986-2990
Markdown (Informal)
[DANGNT@SGU at SemEval-2026 Task 1: A Two-Stage Mistral Generator with DistilBERT Reranking for English Humor Generation](https://aclanthology.org/2026.semeval-1.375/) (Nguyen & Nguyen, SemEval 2026)
ACL