@inproceedings{wroblewska-2025-poleval,
title = "{P}ol{E}val 2025 Task 2: Gender-inclusive {LLM}s for {P}olish",
author = "Wr{\'o}blewska, Alina",
editor = "Kobyli{\'n}ski, {\L}ukasz and
Wr{\'o}blewska, Alina and
Ogrodniczuk, Maciej",
booktitle = "Proceedings of the {P}ol{E}val 2025 Workshop",
month = nov,
year = "2025",
address = "Warsaw",
publisher = "Institute of Computer Science PAS and Association for Computational Linguistics",
url = "https://aclanthology.org/2025.poleval-main.6/",
pages = "39--47",
abstract = "This paper presents the results of the PolEval 2025 shared task on gender-inclusive large language models for Polish. The primary goal of this task is to encourage the development of models capable of generating grammatically well-formed, contextually appropriate, and gender-inclusive output {---} a property of increasing importance in both human-centred NLP and NLG applications. To support this objective, we employed the newly developed Inclusive Polish Instruction Set (IPIS), a high-quality, human-annotated resource designed to guide models toward gender-inclusive behaviour. The shared task comprised two subtasks: gender-inclusive proofreading, which evaluates the ability of a model to transform masculine-generic Polish text into an inclusive equivalent, and gender-sensitive Polish-English translation, which investigates gender marking across languages. A total of six system submissions were received {---} three for each subtask. The evaluation demonstrates that the top-performing gender-inclusive systems outperform both the baseline and state-of-the-art models. These findings highlight the effectiveness of IPIS-tuned approaches and establish strong benchmarks for future research on gender inclusivity in Polish NLP."
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="wroblewska-2025-poleval">
<titleInfo>
<title>PolEval 2025 Task 2: Gender-inclusive LLMs for Polish</title>
</titleInfo>
<name type="personal">
<namePart type="given">Alina</namePart>
<namePart type="family">Wróblewska</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2025-11</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the PolEval 2025 Workshop</title>
</titleInfo>
<name type="personal">
<namePart type="given">Łukasz</namePart>
<namePart type="family">Kobyliński</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Alina</namePart>
<namePart type="family">Wróblewska</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Maciej</namePart>
<namePart type="family">Ogrodniczuk</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Institute of Computer Science PAS and Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Warsaw</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper presents the results of the PolEval 2025 shared task on gender-inclusive large language models for Polish. The primary goal of this task is to encourage the development of models capable of generating grammatically well-formed, contextually appropriate, and gender-inclusive output — a property of increasing importance in both human-centred NLP and NLG applications. To support this objective, we employed the newly developed Inclusive Polish Instruction Set (IPIS), a high-quality, human-annotated resource designed to guide models toward gender-inclusive behaviour. The shared task comprised two subtasks: gender-inclusive proofreading, which evaluates the ability of a model to transform masculine-generic Polish text into an inclusive equivalent, and gender-sensitive Polish-English translation, which investigates gender marking across languages. A total of six system submissions were received — three for each subtask. The evaluation demonstrates that the top-performing gender-inclusive systems outperform both the baseline and state-of-the-art models. These findings highlight the effectiveness of IPIS-tuned approaches and establish strong benchmarks for future research on gender inclusivity in Polish NLP.</abstract>
<identifier type="citekey">wroblewska-2025-poleval</identifier>
<location>
<url>https://aclanthology.org/2025.poleval-main.6/</url>
</location>
<part>
<date>2025-11</date>
<extent unit="page">
<start>39</start>
<end>47</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T PolEval 2025 Task 2: Gender-inclusive LLMs for Polish
%A Wróblewska, Alina
%Y Kobyliński, Łukasz
%Y Wróblewska, Alina
%Y Ogrodniczuk, Maciej
%S Proceedings of the PolEval 2025 Workshop
%D 2025
%8 November
%I Institute of Computer Science PAS and Association for Computational Linguistics
%C Warsaw
%F wroblewska-2025-poleval
%X This paper presents the results of the PolEval 2025 shared task on gender-inclusive large language models for Polish. The primary goal of this task is to encourage the development of models capable of generating grammatically well-formed, contextually appropriate, and gender-inclusive output — a property of increasing importance in both human-centred NLP and NLG applications. To support this objective, we employed the newly developed Inclusive Polish Instruction Set (IPIS), a high-quality, human-annotated resource designed to guide models toward gender-inclusive behaviour. The shared task comprised two subtasks: gender-inclusive proofreading, which evaluates the ability of a model to transform masculine-generic Polish text into an inclusive equivalent, and gender-sensitive Polish-English translation, which investigates gender marking across languages. A total of six system submissions were received — three for each subtask. The evaluation demonstrates that the top-performing gender-inclusive systems outperform both the baseline and state-of-the-art models. These findings highlight the effectiveness of IPIS-tuned approaches and establish strong benchmarks for future research on gender inclusivity in Polish NLP.
%U https://aclanthology.org/2025.poleval-main.6/
%P 39-47
Markdown (Informal)
[PolEval 2025 Task 2: Gender-inclusive LLMs for Polish](https://aclanthology.org/2025.poleval-main.6/) (Wróblewska, PolEval 2025)
ACL