%Aigaion2 BibTeX export from Idiap Publications %Friday 22 November 2024 03:38:36 PM @INPROCEEDINGS{weber-ar-01-24, author = {Weber, Katrin and Bengio, Samy and Bourlard, Herv{\'{e}}}, projects = {Idiap}, month = {12}, title = {{S}peech {R}ecognition Using Advanced {HMM2} {F}eatures}, booktitle = {Automatic Speech Recognition and Understanding Workshop}, year = {2001}, address = {Madonna di Campiglio, Italy}, note = {IDIAP-rr 01-24}, crossref = {weber-rr-01-24}, abstract = {HMM2 is a particular hidden Markov model where state emission probabilities of the temporal (primary) HMM are modeled through (secondary) state-dependent frequency-based HMMs [12]. As shown in [13], a secondary HMM can also be used to extract robust ASR features. Here, we further investigate this novel approach towards using a full HMM2 as feature extractor, working in the spectral domain, and extracting robust formant-like features for standard ASR system. HMM2 performs a nonlinear, state-dependent frequency warping, and it is shown that the resulting frequency segmentation actually contains particularly discriminant features. To further improve the HMM2 system, we complement the initial spectral energy vectors with frequency information. Finally, adding temporal information to the HMM2 feature vector yields further improvements. These conclusions are experimentally validated on the Numbers95 database, where word error rates of 15\\%, using only a 4-dimensional feature vector (3 formant-like parameters and one time index) were obtained.}, pdf = {https://publications.idiap.ch/attachments/reports/2001/rr01-24.pdf}, postscript = {ftp://ftp.idiap.ch/pub/reports/2001/rr01-24.ps.gz}, ipdmembership={speech}, language={English}, } crossreferenced publications: @TECHREPORT{weber-rr-01-24, author = {Weber, Katrin and Bengio, Samy and Bourlard, Herv{\'{e}}}, projects = {Idiap}, title = {{S}peech {R}ecognition Using Advanced {HMM2} {F}eatures}, type = {Idiap-RR}, number = {Idiap-RR-24-2001}, year = {2001}, institution = {IDIAP}, address = {Martigny, Switzerland}, note = {Published: ASRU 2001, Madonna di Campiglio, Italy, December 2001}, abstract = {HMM2 is a particular hidden Markov model where state emission probabilities of the temporal (primary) HMM are modeled through (secondary) state-dependent frequency-based HMMs [12]. As shown in [13], a secondary HMM can also be used to extract robust ASR features. Here, we further investigate this novel approach towards using a full HMM2 as feature extractor, working in the spectral domain, and extracting robust formant-like features for standard ASR system. HMM2 performs a nonlinear, state-dependent frequency warping, and it is shown that the resulting frequency segmentation actually contains particularly discriminant features. To further improve the HMM2 system, we complement the initial spectral energy vectors with frequency information. Finally, adding temporal information to the HMM2 feature vector yields further improvements. These conclusions are experimentally validated on the Numbers95 database, where word error rates of 15\\%, using only a 4-dimensional feature vector (3 formant-like parameters and one time index) were obtained.}, pdf = {https://publications.idiap.ch/attachments/reports/2001/rr01-24.pdf}, postscript = {ftp://ftp.idiap.ch/pub/reports/2001/rr01-24.ps.gz}, ipdinar={2001}, ipdmembership={speech}, language={English}, }