%Aigaion2 BibTeX export from Idiap Publications
%Saturday 21 December 2024 07:24:40 PM

% Conference paper (Interspeech 2008). Its crossref field points at the Idiap
% research report of the same work, which is defined after this entry.
% NOTE(review): with crossref, classic BibTeX copies every field missing here
% (type, number, institution) from the report entry -- confirm that this
% inheritance is intended rather than a plain "see also" link.
@inproceedings{sgarimel:is:2008,
  author        = {Sivaram, G. S. V. S. and Hermansky, Hynek},
  projects      = {Idiap},
  title         = {Introducing Temporal Asymmetries in Feature Extraction for Automatic Speech Recognition},
  booktitle     = {Interspeech 2008},
  year          = {2008},
  note          = {IDIAP-RR 08-25},
  crossref      = {sgarimel:rr08-25},
  abstract      = {We propose a new auditory inspired feature extraction technique for automatic speech recognition (ASR). Features are extracted by filtering the temporal trajectory of spectral energies in each critical band of speech by a bank of finite impulse response (FIR) filters. Impulse responses of these filters are derived from a modified Gabor envelope in order to emulate asymmetries of the temporal receptive field (TRF) profiles observed in higher level auditory neurons. We obtain $11.4\% $ relative improvement in word error rate on OGI-Digits database and, $3.2\%$ relative improvement in phoneme error rate on TIMIT database over the MRASTA technique.},
  pdf           = {https://publications.idiap.ch/attachments/papers/2008/sgarimel-is-2008.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/papers/2008/sgarimel-is-2008.ps.gz},
  ipdmembership = {speech},
}

% crossreferenced publications:

% Research-report version of the paper above. It is the crossref target of
% that entry, so it must stay below it: classic BibTeX requires a
% cross-referenced parent to appear after every entry that refers to it.
@techreport{sgarimel:rr08-25,
  author        = {Sivaram, G. S. V. S. and Hermansky, Hynek},
  projects      = {Idiap},
  title         = {Introducing Temporal Asymmetries in Feature Extraction for Automatic Speech Recognition},
  type          = {Idiap-RR},
  number        = {Idiap-RR-25-2008},
  year          = {2008},
  institution   = {IDIAP},
  abstract      = {We propose a new auditory inspired feature extraction technique for automatic speech recognition (ASR). Features are extracted by filtering the temporal trajectory of spectral energies in each critical band of speech by a bank of finite impulse response (FIR) filters. Impulse responses of these filters are derived from a modified Gabor envelope in order to emulate asymmetries of the temporal receptive field (TRF) profiles observed in higher level auditory neurons. We obtain $11.4\% $ relative improvement in word error rate on OGI-Digits database and, $3.2\%$ relative improvement in phoneme error rate on TIMIT database over the MRASTA technique.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2008/sgarimel-idiap-rr-08-25.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2008/sgarimel-idiap-rr-08-25.ps.gz},
  ipdmembership = {speech},
}