@inproceedings{firmino-etal-2026-retrato,
title = "{R}etrato{\_}{C}antado: Cria{\c{c}}{\~a}o e An{\'a}lise de um Corpus para Representa{\c{c}}{\~o}es de Identidade em Letras de M{\'u}sicas Brasileiras",
author = "Firmino, Vit{\'o}ria P. and
Lopes, Janaina N. de S. and
Nogueira, Bruno M. and
Reis, Val{\'e}ria Q. dos",
editor = "Souza, Marlo and
de-Dios-Flores, Iria and
Santos, Diana and
Freitas, Larissa and
Souza, Jackson Wilke da Cruz and
Ribeiro, Eug{\'e}nio",
booktitle = "Proceedings of the 17th International Conference on Computational Processing of {P}ortuguese ({PROPOR} 2026) - Vol. 1",
month = apr,
year = "2026",
address = "Salvador, Brazil",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.propor-1.68/",
pages = "687--696",
ISBN = "979-8-89176-387-6",
abstract = "This paper presents the development of Retrato{\_}Cantado, a dataset of sentences extracted from Brazilian song lyrics and manually annotated to identify and categorize predicative constructions that describe individuals. The corpus findings validate the effectiveness of lexical-syntactic patterns for identifying predicative sentences, confirming their suitability for large-scale linguistic annotation tasks. The dataset also serves as a valuable resource for the analysis of textual discourse and the representation of social groups in Brazilian culture. We additionally trained a person-characterization classifier to illustrate the applicability of the dataset to the automatic detection of predicative descriptions, which achieved high accuracy and highlights the potential for creating more specialized models capable of detecting physical and sociocognitive categories, as well as performing sentiment polarity analysis."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="firmino-etal-2026-retrato">
<titleInfo>
<title>Retrato_Cantado: Criação e Análise de um Corpus para Representações de Identidade em Letras de Músicas Brasileiras</title>
</titleInfo>
<name type="personal">
<namePart type="given">Vitória</namePart>
<namePart type="given">P</namePart>
<namePart type="family">Firmino</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Janaina</namePart>
<namePart type="given">N</namePart>
<namePart type="given">de</namePart>
<namePart type="given">S</namePart>
<namePart type="family">Lopes</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Bruno</namePart>
<namePart type="given">M</namePart>
<namePart type="family">Nogueira</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Valéria</namePart>
<namePart type="given">Q</namePart>
<namePart type="given">dos</namePart>
<namePart type="family">Reis</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-04</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 17th International Conference on Computational Processing of Portuguese (PROPOR 2026) - Vol. 1</title>
</titleInfo>
<name type="personal">
<namePart type="given">Marlo</namePart>
<namePart type="family">Souza</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Iria</namePart>
<namePart type="family">de-Dios-Flores</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Diana</namePart>
<namePart type="family">Santos</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Larissa</namePart>
<namePart type="family">Freitas</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jackson</namePart>
<namePart type="given">Wilke</namePart>
<namePart type="given">da</namePart>
<namePart type="given">Cruz</namePart>
<namePart type="family">Souza</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Eugénio</namePart>
<namePart type="family">Ribeiro</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Salvador, Brazil</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-387-6</identifier>
</relatedItem>
<abstract>This paper presents the development of Retrato_Cantado, a dataset of sentences extracted from Brazilian song lyrics and manually annotated to identify and categorize predicative constructions that describe individuals. The corpus findings validate the effectiveness of lexical-syntactic patterns for identifying predicative sentences, confirming their suitability for large-scale linguistic annotation tasks. The dataset also serves as a valuable resource for the analysis of textual discourse and the representation of social groups in Brazilian culture. We additionally trained a person-characterization classifier to illustrate the applicability of the dataset to the automatic detection of predicative descriptions, which achieved high accuracy and highlights the potential for creating more specialized models capable of detecting physical and sociocognitive categories, as well as performing sentiment polarity analysis.</abstract>
<identifier type="citekey">firmino-etal-2026-retrato</identifier>
<location>
<url>https://aclanthology.org/2026.propor-1.68/</url>
</location>
<part>
<date>2026-04</date>
<extent unit="page">
<start>687</start>
<end>696</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Retrato_Cantado: Criação e Análise de um Corpus para Representações de Identidade em Letras de Músicas Brasileiras
%A Firmino, Vitória P.
%A Lopes, Janaina N. de S.
%A Nogueira, Bruno M.
%A Reis, Valéria Q. dos
%Y Souza, Marlo
%Y de-Dios-Flores, Iria
%Y Santos, Diana
%Y Freitas, Larissa
%Y Souza, Jackson Wilke da Cruz
%Y Ribeiro, Eugénio
%S Proceedings of the 17th International Conference on Computational Processing of Portuguese (PROPOR 2026) - Vol. 1
%D 2026
%8 April
%I Association for Computational Linguistics
%C Salvador, Brazil
%@ 979-8-89176-387-6
%F firmino-etal-2026-retrato
%X This paper presents the development of Retrato_Cantado, a dataset of sentences extracted from Brazilian song lyrics and manually annotated to identify and categorize predicative constructions that describe individuals. The corpus findings validate the effectiveness of lexical-syntactic patterns for identifying predicative sentences, confirming their suitability for large-scale linguistic annotation tasks. The dataset also serves as a valuable resource for the analysis of textual discourse and the representation of social groups in Brazilian culture. We additionally trained a person-characterization classifier to illustrate the applicability of the dataset to the automatic detection of predicative descriptions, which achieved high accuracy and highlights the potential for creating more specialized models capable of detecting physical and sociocognitive categories, as well as performing sentiment polarity analysis.
%U https://aclanthology.org/2026.propor-1.68/
%P 687-696
Markdown (Informal)
[Retrato_Cantado: Criação e Análise de um Corpus para Representações de Identidade em Letras de Músicas Brasileiras](https://aclanthology.org/2026.propor-1.68/) (Firmino et al., PROPOR 2026)
ACL