%Aigaion2 BibTeX export from Idiap Publications
%Thursday 21 November 2024 11:48:13 AM

% Interspeech 2008 paper sharing authors, title and abstract with the Idiap
% report named in the note field. The report is linked through xref instead of
% crossref: this entry already carries its own booktitle and year, and crossref
% inheritance would copy the report's number, type and institution fields into
% it (standard styles then print a stray "number ..." and warn about a number
% without a series).
@INPROCEEDINGS{sgarimel:is:2008,
         author = {Sivaram, G. S. V. S. and Hermansky, Hynek},
       projects = {Idiap},
          title = {Introducing Temporal Asymmetries in Feature Extraction for Automatic Speech Recognition},
      booktitle = {Interspeech 2008},
           year = {2008},
           note = {IDIAP-RR 08-25},
           xref = {sgarimel:rr08-25},
       abstract = {We propose a new auditory inspired feature extraction technique for automatic speech recognition (ASR). Features are extracted by filtering the temporal trajectory of spectral energies in each critical band of speech by a bank of finite impulse response (FIR) filters. Impulse responses of these filters are derived from a modified Gabor envelope in order to emulate asymmetries of the temporal receptive field (TRF) profiles observed in higher level auditory neurons. We obtain $11.4\% $ relative improvement in word error rate on OGI-Digits database and, $3.2\%$ relative improvement in phoneme error rate on TIMIT database over the MRASTA technique.},
            pdf = {https://publications.idiap.ch/attachments/papers/2008/sgarimel-is-2008.pdf},
     postscript = {ftp://ftp.idiap.ch/pub/papers/2008/sgarimel-is-2008.ps.gz},
  ipdmembership = {speech},
}



% Cross-referenced publications:
% Idiap report entry. The type field holds a descriptive label and the number
% field holds the complete report identifier, so styles that print the type
% followed by the number do not repeat the "Idiap-RR" prefix.
% NOTE(review): "Research Report" is the presumed expansion of "RR" - confirm.
@TECHREPORT{sgarimel:rr08-25,
         author = {Sivaram, G. S. V. S. and Hermansky, Hynek},
       projects = {Idiap},
          title = {Introducing Temporal Asymmetries in Feature Extraction for Automatic Speech Recognition},
           type = {Research Report},
         number = {Idiap-RR-25-2008},
           year = {2008},
    institution = {IDIAP},
       abstract = {We propose a new auditory inspired feature extraction technique for automatic speech recognition (ASR). Features are extracted by filtering the temporal trajectory of spectral energies in each critical band of speech by a bank of finite impulse response (FIR) filters. Impulse responses of these filters are derived from a modified Gabor envelope in order to emulate asymmetries of the temporal receptive field (TRF) profiles observed in higher level auditory neurons. We obtain $11.4\% $ relative improvement in word error rate on OGI-Digits database and, $3.2\%$ relative improvement in phoneme error rate on TIMIT database over the MRASTA technique.},
            pdf = {https://publications.idiap.ch/attachments/reports/2008/sgarimel-idiap-rr-08-25.pdf},
     postscript = {ftp://ftp.idiap.ch/pub/reports/2008/sgarimel-idiap-rr-08-25.ps.gz},
  ipdmembership = {speech},
}