@inproceedings{shahzad-etal-2026-upr,
title = "{UPR} at {S}em{E}val-2026 Task 9: Multi-Label Classification of Polarization Across Social Dimensions and Manifestation Identification in {U}rdu",
author = "Shahzad, Mtayyaba and
Khadam, Inzmam and
Mahmood, Zaufishan and
Rashid, Junaid and
Hayat, Shamaila and
Ayub, Fakhar",
editor = "Kochmar, Ekaterina and
Ghosh, Debanjan and
North, Kai and
Komachi, Mamoru",
booktitle = "Proceedings of the 20th {I}nternational {W}orkshop on {S}emantic {E}valuation (2026)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.semeval-1.333/",
pages = "2642--2647",
ISBN = "979-8-89176-414-9",
abstract = "The analysis of polarized content on social networks is crucial for understanding public discourse; however, research on low-resource languages such as Urdu remains limited. In this work, we address two complementary subtasks of polarization analysis in Urdu social media text. First, we formulate polarization classification across multiple social dimensions as a multi-label task, including political, religious, racial/ethnic, gender/sexual, and other. We fine-tune XLM-RoBERTa for multi-label classification with language-specific preprocessing, duplicate filtering, and data augmentation to handle class imbalance. The proposed model achieves a Macro F1-score of 0.758 for social-dimension polarization classification.Second, we perform polarization manifestation identification, focusing on how polarization is expressed in text through six manifestations: stereotype, vilification, dehumanization, extreme language, lack of empathy, and invalidation. Using the same transformer-based framework with imbalance-aware training, our system achieves a Macro F1-score of 0.72 on the official test set. These results demonstrate the effectiveness of multilingual transformer models for multi-dimensional polarization analysis in low-resource Urdu text."
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="shahzad-etal-2026-upr">
<titleInfo>
<title>UPR at SemEval-2026 Task 9: Multi-Label Classification of Polarization Across Social Dimensions and Manifestation Identification in Urdu</title>
</titleInfo>
<name type="personal">
<namePart type="given">Mtayyaba</namePart>
<namePart type="family">Shahzad</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Inzmam</namePart>
<namePart type="family">Khadam</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Zaufishan</namePart>
<namePart type="family">Mahmood</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Junaid</namePart>
<namePart type="family">Rashid</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Shamaila</namePart>
<namePart type="family">Hayat</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Fakhar</namePart>
<namePart type="family">Ayub</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 20th International Workshop on Semantic Evaluation (2026)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Ekaterina</namePart>
<namePart type="family">Kochmar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Debanjan</namePart>
<namePart type="family">Ghosh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kai</namePart>
<namePart type="family">North</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mamoru</namePart>
<namePart type="family">Komachi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-414-9</identifier>
</relatedItem>
<abstract>The analysis of polarized content on social networks is crucial for understanding public discourse; however, research on low-resource languages such as Urdu remains limited. In this work, we address two complementary subtasks of polarization analysis in Urdu social media text. First, we formulate polarization classification across multiple social dimensions as a multi-label task, including political, religious, racial/ethnic, gender/sexual, and other. We fine-tune XLM-RoBERTa for multi-label classification with language-specific preprocessing, duplicate filtering, and data augmentation to handle class imbalance. The proposed model achieves a Macro F1-score of 0.758 for social-dimension polarization classification.Second, we perform polarization manifestation identification, focusing on how polarization is expressed in text through six manifestations: stereotype, vilification, dehumanization, extreme language, lack of empathy, and invalidation. Using the same transformer-based framework with imbalance-aware training, our system achieves a Macro F1-score of 0.72 on the official test set. These results demonstrate the effectiveness of multilingual transformer models for multi-dimensional polarization analysis in low-resource Urdu text.</abstract>
<identifier type="citekey">shahzad-etal-2026-upr</identifier>
<location>
<url>https://aclanthology.org/2026.semeval-1.333/</url>
</location>
<part>
<date>2026-07</date>
<extent unit="page">
<start>2642</start>
<end>2647</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T UPR at SemEval-2026 Task 9: Multi-Label Classification of Polarization Across Social Dimensions and Manifestation Identification in Urdu
%A Shahzad, Mtayyaba
%A Khadam, Inzmam
%A Mahmood, Zaufishan
%A Rashid, Junaid
%A Hayat, Shamaila
%A Ayub, Fakhar
%Y Kochmar, Ekaterina
%Y Ghosh, Debanjan
%Y North, Kai
%Y Komachi, Mamoru
%S Proceedings of the 20th International Workshop on Semantic Evaluation (2026)
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, USA
%@ 979-8-89176-414-9
%F shahzad-etal-2026-upr
%X The analysis of polarized content on social networks is crucial for understanding public discourse; however, research on low-resource languages such as Urdu remains limited. In this work, we address two complementary subtasks of polarization analysis in Urdu social media text. First, we formulate polarization classification across multiple social dimensions as a multi-label task, including political, religious, racial/ethnic, gender/sexual, and other. We fine-tune XLM-RoBERTa for multi-label classification with language-specific preprocessing, duplicate filtering, and data augmentation to handle class imbalance. The proposed model achieves a Macro F1-score of 0.758 for social-dimension polarization classification.Second, we perform polarization manifestation identification, focusing on how polarization is expressed in text through six manifestations: stereotype, vilification, dehumanization, extreme language, lack of empathy, and invalidation. Using the same transformer-based framework with imbalance-aware training, our system achieves a Macro F1-score of 0.72 on the official test set. These results demonstrate the effectiveness of multilingual transformer models for multi-dimensional polarization analysis in low-resource Urdu text.
%U https://aclanthology.org/2026.semeval-1.333/
%P 2642-2647
Markdown (Informal)
[UPR at SemEval-2026 Task 9: Multi-Label Classification of Polarization Across Social Dimensions and Manifestation Identification in Urdu](https://aclanthology.org/2026.semeval-1.333/) (Shahzad et al., SemEval 2026)
ACL