% Aigaion2 BibTeX export from Idiap Publications
% Friday 22 November 2024 03:38:30 PM

% Conference paper (MLMI 2007).
% NOTE: the link to the companion technical report is stored in `xref`
% rather than `crossref`. `crossref` makes the child entry inherit every
% field it lacks (here: type, number, institution), which, depending on the
% bibliography style, can leak the report number into the rendered conference
% citation. `xref` records the relation without inheritance under
% biblatex/Biber and is ignored as an unknown field by classic BibTeX.
% The human-readable pointer to the report is kept in `note`.
@INPROCEEDINGS{aradilla:mlmi:2007,
  author        = {Aradilla, Guillermo and Bourlard, Herv{\'{e}}},
  projects      = {Idiap},
  title         = {Posterior-Based Features and Distances in Template Matching for Speech Recognition},
  booktitle     = {4th Joint Workshop on Multimodal Interaction and Related Machine Learning Algorithms ({MLMI})},
  year          = {2007},
  note          = {IDIAP-RR 07-41},
  xref          = {aradilla:rr07-41},
  abstract      = {The use of large speech corpora in example-based approaches for speech recognition is mainly focused on increasing the number of examples. This strategy presents some difficulties because databases may not provide enough examples for some rare words. In this paper we present a different method to incorporate the information contained in such corpora in these example-based systems. A multilayer perceptron is trained on these databases to estimate speaker and task-independent phoneme posterior probabilities, which are used as speech features. By reducing the variability of features, fewer examples are needed to properly characterize a word. In this way, performance can be highly improved when limited number of examples is available. Moreover, we also study posterior-based local distances, these result more effective than traditional Euclidean distance. Experiments on Phonebook database support the idea that posterior features with a proper local distance can yield competitive results.},
  pdf           = {https://publications.idiap.ch/attachments/papers/2007/aradilla-mlmi-2007.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/papers/2007/aradilla-mlmi-2007.ps.gz},
  ipdmembership = {speech},
}

% Cross-referenced publications:

% Idiap research report version of the paper above (same authors and title).
@TECHREPORT{aradilla:rr07-41,
  author        = {Aradilla, Guillermo and Bourlard, Herv{\'{e}}},
  projects      = {Idiap},
  title         = {Posterior-Based Features and Distances in Template Matching for Speech Recognition},
  type          = {Idiap-RR},
  number        = {Idiap-RR-41-2007},
  year          = {2007},
  institution   = {IDIAP},
  abstract      = {The use of large speech corpora in example-based approaches for speech recognition is mainly focused on increasing the number of examples. This strategy presents some difficulties because databases may not provide enough examples for some rare words. In this paper we present a different method to incorporate the information contained in such corpora in these example-based systems. A multilayer perceptron is trained on these databases to estimate speaker and task-independent phoneme posterior probabilities, which are used as speech features. By reducing the variability of features, fewer examples are needed to properly characterize a word. In this way, performance can be highly improved when limited number of examples is available. Moreover, we also study posterior-based local distances, these result more effective than traditional Euclidean distance. Experiments on Phonebook database support the idea that posterior features with a proper local distance can yield competitive results.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2007/aradilla-idiap-rr-07-41.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2007/aradilla-idiap-rr-07-41.ps.gz},
  ipdmembership = {speech},
}