%Aigaion2 BibTeX export from Idiap Publications
%Tuesday 10 December 2024 12:26:47 PM

% Conference paper (Interspeech 2008). The crossref field below points at the
% Idiap research-report version of the same work, not at a parent proceedings.
% NOTE(review): classic BibTeX copies fields missing here (type, number,
% institution) from the cross-referenced entry; confirm this is intended, or
% switch to a non-inheriting link (e.g. biblatex xref/related) if it is not.
@INPROCEEDINGS{tsamuel:interspeech-2:2008,
  author        = {Thomas, Samuel and Ganapathy, Sriram and Hermansky, Hynek},
  projects      = {Idiap},
  title         = {{Hilbert} Envelope Based Spectro-Temporal Features for Phoneme Recognition in Telephone Speech},
  booktitle     = {Interspeech 2008},
  year          = {2008},
  note          = {IDIAP-RR 08-18},
  crossref      = {tsamuel:rr08-18},
  abstract      = {In this paper, we present a spectro-temporal feature extraction technique using sub-band Hilbert envelopes of relatively long segments of speech signal. Hilbert envelopes of the sub-bands are estimated using Frequency Domain Linear Prediction (FDLP). Spectral features are derived by integrating the sub-band Hilbert envelopes in short-term frames and the temporal features are formed by converting the FDLP envelopes into modulation frequency components. These are then combined at the phoneme posterior level and are used as the input features for a phoneme recognition system. In order to improve the robustness of the proposed features to telephone speech, the sub-band temporal envelopes are gain normalized prior to feature extraction.
Phoneme recognition experiments on telephone speech in the HTIMIT database show significant performance improvements for the proposed features when compared to other robust feature techniques (average relative reduction of $11\%$ in phoneme error rate).},
  pdf           = {https://publications.idiap.ch/attachments/papers/2008/tsamuel-interspeech-2-2008.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/papers/2008/tsamuel-interspeech-2-2008.ps.gz},
  ipdmembership = {speech},
}

% crossreferenced publications:
% Idiap research report for the paper above. It must stay after the entry
% that cross-references it (classic BibTeX ordering requirement).
@TECHREPORT{tsamuel:rr08-18,
  author        = {Thomas, Samuel and Ganapathy, Sriram and Hermansky, Hynek},
  projects      = {Idiap},
  title         = {{Hilbert} Envelope Based Spectro-Temporal Features for Phoneme Recognition in Telephone Speech},
  type          = {Idiap-RR},
  number        = {Idiap-RR-18-2008},
  year          = {2008},
  institution   = {IDIAP},
  abstract      = {In this paper, we present a spectro-temporal feature extraction technique using sub-band Hilbert envelopes of relatively long segments of speech signal. Hilbert envelopes of the sub-bands are estimated using Frequency Domain Linear Prediction (FDLP). Spectral features are derived by integrating the sub-band Hilbert envelopes in short-term frames and the temporal features are formed by converting the FDLP envelopes into modulation frequency components. These are then combined at the phoneme posterior level and are used as the input features for a phoneme recognition system. In order to improve the robustness of the proposed features to telephone speech, the sub-band temporal envelopes are gain normalized prior to feature extraction.
Phoneme recognition experiments on telephone speech in the HTIMIT database show significant performance improvements for the proposed features when compared to other robust feature techniques (average relative reduction of $11\%$ in phoneme error rate).},
  pdf           = {https://publications.idiap.ch/attachments/reports/2008/tsamuel-idiap-rr-08-18.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2008/tsamuel-idiap-rr-08-18.ps.gz},
  ipdmembership = {speech},
}