@inproceedings{truong-etal-2025-dfat,
title = "{DFAT}: Dual-stage Fusion of Acoustic and Text feature for Speech Emotion Recognition",
author = "Truong, Nhi Nguyen Yen and
Quang, Sang Le and
Quang, Huy Tran and
Xuan, Tri Pham and
Ham, Duong Tran and
Hai, Binh Tran Le and
Huynh, Tin and
Hoang, Kiem",
editor = "Mai, Luong Chi and
Huyen, Nguyen Thi Minh and
Trang, Nguyen Thi Thu",
booktitle = "Proceedings of the 11th International Workshop on Vietnamese Language and Speech Processing",
month = oct,
year = "2025",
address = "Hanoi, Vietnam",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2025.vlsp-1.6/",
pages = "36--44"
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="truong-etal-2025-dfat">
<titleInfo>
<title>DFAT: Dual-stage Fusion of Acoustic and Text feature for Speech Emotion Recognition</title>
</titleInfo>
<name type="personal">
<namePart type="given">Nhi</namePart>
<namePart type="given">Nguyen</namePart>
<namePart type="given">Yen</namePart>
<namePart type="family">Truong</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sang</namePart>
<namePart type="given">Le</namePart>
<namePart type="family">Quang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Huy</namePart>
<namePart type="given">Tran</namePart>
<namePart type="family">Quang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tri</namePart>
<namePart type="given">Pham</namePart>
<namePart type="family">Xuan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Duong</namePart>
<namePart type="given">Tran</namePart>
<namePart type="family">Ham</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Binh</namePart>
<namePart type="given">Tran</namePart>
<namePart type="given">Le</namePart>
<namePart type="family">Hai</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tin</namePart>
<namePart type="family">Huynh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kiem</namePart>
<namePart type="family">Hoang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2025-10</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 11th International Workshop on Vietnamese Language and Speech Processing</title>
</titleInfo>
<name type="personal">
<namePart type="given">Luong</namePart>
<namePart type="given">Chi</namePart>
<namePart type="family">Mai</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nguyen</namePart>
<namePart type="given">Thi</namePart>
<namePart type="given">Minh</namePart>
<namePart type="family">Huyen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nguyen</namePart>
<namePart type="given">Thi</namePart>
<namePart type="given">Thu</namePart>
<namePart type="family">Trang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Hanoi, Vietnam</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<identifier type="citekey">truong-etal-2025-dfat</identifier>
<location>
<url>https://aclanthology.org/2025.vlsp-1.6/</url>
</location>
<part>
<date>2025-10</date>
<extent unit="page">
<start>36</start>
<end>44</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T DFAT: Dual-stage Fusion of Acoustic and Text feature for Speech Emotion Recognition
%A Truong, Nhi Nguyen Yen
%A Quang, Sang Le
%A Quang, Huy Tran
%A Xuan, Tri Pham
%A Ham, Duong Tran
%A Hai, Binh Tran Le
%A Huynh, Tin
%A Hoang, Kiem
%Y Mai, Luong Chi
%Y Huyen, Nguyen Thi Minh
%Y Trang, Nguyen Thi Thu
%S Proceedings of the 11th International Workshop on Vietnamese Language and Speech Processing
%D 2025
%8 October
%I Association for Computational Linguistics
%C Hanoi, Vietnam
%F truong-etal-2025-dfat
%U https://aclanthology.org/2025.vlsp-1.6/
%P 36-44
Markdown (Informal)
[DFAT: Dual-stage Fusion of Acoustic and Text feature for Speech Emotion Recognition](https://aclanthology.org/2025.vlsp-1.6/) (Truong et al., VLSP 2025)
ACL
- Nhi Nguyen Yen Truong, Sang Le Quang, Huy Tran Quang, Tri Pham Xuan, Duong Tran Ham, Binh Tran Le Hai, Tin Huynh, and Kiem Hoang. 2025. DFAT: Dual-stage Fusion of Acoustic and Text feature for Speech Emotion Recognition. In Proceedings of the 11th International Workshop on Vietnamese Language and Speech Processing, pages 36–44, Hanoi, Vietnam. Association for Computational Linguistics.