% Aigaion2 BibTeX export from Idiap Publications
% Saturday 21 December 2024 07:27:20 PM

% Workshop paper (ASRU 2003). The Idiap research report listed further
% below carries the same authors, title and abstract.
% The link to that report uses "xref" rather than "crossref": the report is a
% companion version, not a containing proceedings volume, and "crossref" would
% make styles inherit the report's type/number/institution into this entry.
@inproceedings{ikbal-rr-03-36p,
  author        = {Ikbal, Shajith and Hermansky, Hynek and Bourlard, Herv{\'{e}}},
  title         = {Nonlinear Spectral Transformations for Robust Speech Recognition},
  booktitle     = {Proceedings of the {IEEE} Automatic Speech Recognition and Understanding ({ASRU}) Workshop 2003},
  year          = {2003},
  month         = dec,
  address       = {St. Thomas, U.S. Virgin Islands, USA},
  xref          = {ikbal-rr-03-36},
  abstract      = {Recently, a nonlinear transformation of autocorrelation coefficients named Phase AutoCorrelation (PAC) coefficients has been considered for feature extraction \cite{ikbal03}. PAC based features show improved robustness to additive noise as a result of two operations, performed during the computation of PAC, namely energy normalization and inverse cosine transformation. In spite of the improved robustness achieved for noisy speech, these two operations lead to some degradation in recognition performance for clean speech. In this paper, we try to alleviate this problem, first by introducing the energy information back into the PAC based features, and second by studying alternatives to inverse cosine function. Simply appending the frame energy as an additional coefficient in the PAC features has resulted in noticeable improvement in the performance for clean speech.
Study of alternatives to inverse cosine transformation leads to a conclusion that linear transformation is the best for clean speech, while nonlinear functions help to improve robustness in noise.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2003/rr03-36.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2003/rr03-36.ps.gz},
  projects      = {Idiap},
  ipdmembership = {speech},
}

% Cross-referenced publications:

% Idiap research report with the same authors, title and abstract as the
% workshop paper above; kept after that entry so the reference target
% follows the entry that points to it.
@techreport{ikbal-rr-03-36,
  author        = {Ikbal, Shajith and Hermansky, Hynek and Bourlard, Herv{\'{e}}},
  title         = {Nonlinear Spectral Transformations for Robust Speech Recognition},
  type          = {Idiap-RR},
  number        = {Idiap-RR-36-2003},
  institution   = {IDIAP},
  address       = {Martigny, Switzerland},
  year          = {2003},
  abstract      = {Recently, a nonlinear transformation of autocorrelation coefficients named Phase AutoCorrelation (PAC) coefficients has been considered for feature extraction \cite{ikbal03}. PAC based features show improved robustness to additive noise as a result of two operations, performed during the computation of PAC, namely energy normalization and inverse cosine transformation. In spite of the improved robustness achieved for noisy speech, these two operations lead to some degradation in recognition performance for clean speech. In this paper, we try to alleviate this problem, first by introducing the energy information back into the PAC based features, and second by studying alternatives to inverse cosine function. Simply appending the frame energy as an additional coefficient in the PAC features has resulted in noticeable improvement in the performance for clean speech.
Study of alternatives to inverse cosine transformation leads to a conclusion that linear transformation is the best for clean speech, while nonlinear functions help to improve robustness in noise.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2003/rr03-36.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2003/rr03-36.ps.gz},
  projects      = {Idiap},
  ipdinar       = {2003},
  ipdmembership = {speech},
  language      = {English},
}