@inproceedings{muthuramalingam-etal-2024-chirp,
title = "Chirp Group Delay based Feature for Speech Applications",
author = "Muthuramalingam, Malarvizhi and
Gladston, Anushiya Rachel and
Vijayalakshmi, P and
Nagarajan, T",
editor = "Lalitha Devi, Sobha and
Arora, Karunesh",
booktitle = "Proceedings of the 21st International Conference on Natural Language Processing (ICON)",
month = dec,
year = "2024",
address = "AU-KBC Research Centre, Chennai, India",
publisher = "NLP Association of India (NLPAI)",
url = "https://aclanthology.org/2024.icon-1.52/",
pages = "449--453",
abstract = "Conventional Fast Fourier Transform (FFT),computed on the unit circle, gives an accurate representation of the spectrum if the signal under consideration is because of the sustained oscillations. However, practical signals are not sustained oscillations. For the signals that are either decaying/growing along time, the phase spectrum computed using conventional FFT is not accurate, and in turn, the magnitude spectrum too. Hence a feature, based on a variant of the group delay spectrum, namely the chirp group delay (CGD) spectrum, is proposed. The efficacy of the proposed feature is evaluated in Gaussian Mixture Model (GMM) and Convolutional Neural Network (CNN)-based speaker identification systems. Analysis reveals a significant increase in performance when using the CGD-based feature over the magnitude spectrum."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="muthuramalingam-etal-2024-chirp">
<titleInfo>
<title>Chirp Group Delay based Feature for Speech Applications</title>
</titleInfo>
<name type="personal">
<namePart type="given">Malarvizhi</namePart>
<namePart type="family">Muthuramalingam</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Anushiya</namePart>
<namePart type="given">Rachel</namePart>
<namePart type="family">Gladston</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">P</namePart>
<namePart type="family">Vijayalakshmi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">T</namePart>
<namePart type="family">Nagarajan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 21st International Conference on Natural Language Processing (ICON)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sobha</namePart>
<namePart type="family">Lalitha Devi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Karunesh</namePart>
<namePart type="family">Arora</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>NLP Association of India (NLPAI)</publisher>
<place>
<placeTerm type="text">AU-KBC Research Centre, Chennai, India</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Conventional Fast Fourier Transform (FFT),computed on the unit circle, gives an accurate representation of the spectrum if the signal under consideration is because of the sustained oscillations. However, practical signals are not sustained oscillations. For the signals that are either decaying/growing along time, the phase spectrum computed using conventional FFT is not accurate, and in turn, the magnitude spectrum too. Hence a feature, based on a variant of the group delay spectrum, namely the chirp group delay (CGD) spectrum, is proposed. The efficacy of the proposed feature is evaluated in Gaussian Mixture Model (GMM) and Convolutional Neural Network (CNN)-based speaker identification systems. Analysis reveals a significant increase in performance when using the CGD-based feature over the magnitude spectrum.</abstract>
<identifier type="citekey">muthuramalingam-etal-2024-chirp</identifier>
<location>
<url>https://aclanthology.org/2024.icon-1.52/</url>
</location>
<part>
<date>2024-12</date>
<extent unit="page">
<start>449</start>
<end>453</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Chirp Group Delay based Feature for Speech Applications
%A Muthuramalingam, Malarvizhi
%A Gladston, Anushiya Rachel
%A Vijayalakshmi, P.
%A Nagarajan, T.
%Y Lalitha Devi, Sobha
%Y Arora, Karunesh
%S Proceedings of the 21st International Conference on Natural Language Processing (ICON)
%D 2024
%8 December
%I NLP Association of India (NLPAI)
%C AU-KBC Research Centre, Chennai, India
%F muthuramalingam-etal-2024-chirp
%X Conventional Fast Fourier Transform (FFT),computed on the unit circle, gives an accurate representation of the spectrum if the signal under consideration is because of the sustained oscillations. However, practical signals are not sustained oscillations. For the signals that are either decaying/growing along time, the phase spectrum computed using conventional FFT is not accurate, and in turn, the magnitude spectrum too. Hence a feature, based on a variant of the group delay spectrum, namely the chirp group delay (CGD) spectrum, is proposed. The efficacy of the proposed feature is evaluated in Gaussian Mixture Model (GMM) and Convolutional Neural Network (CNN)-based speaker identification systems. Analysis reveals a significant increase in performance when using the CGD-based feature over the magnitude spectrum.
%U https://aclanthology.org/2024.icon-1.52/
%P 449-453
Markdown (Informal)
[Chirp Group Delay based Feature for Speech Applications](https://aclanthology.org/2024.icon-1.52/) (Muthuramalingam et al., ICON 2024)
ACL
- Malarvizhi Muthuramalingam, Anushiya Rachel Gladston, P Vijayalakshmi, and T Nagarajan. 2024. Chirp Group Delay based Feature for Speech Applications. In Proceedings of the 21st International Conference on Natural Language Processing (ICON), pages 449–453, AU-KBC Research Centre, Chennai, India. NLP Association of India (NLPAI).