%Aigaion2 BibTeX export from Idiap Publications
%Saturday 21 December 2024 04:55:22 PM

% Layout note: the header comments above and the entry below are kept on
% separate lines so that parsers which treat a top-level percent sign as a
% comment-to-end-of-line cannot swallow the entry.
% The fields "projects" and "pdf" are not standard BibTeX fields; standard
% styles ignore unknown fields, so they act as annotations only.

@inproceedings{Asaei_SPARS_2017,
  author    = {Asaei, Afsaneh and Cernak, Milos and Bourlard, Herv{\'{e}} and Ram, Dhananjay},
  title     = {Sparse Pronunciation Codes for Perceptual Phonetic Information Assessment},
  booktitle = {Workshop on Signal Processing with Adaptive Sparse Structured Representations (SPARS)},
  year      = {2017},
  note      = {Proceeding of Abstracts for Communication},
  projects  = {Idiap, PHASER-QUAD},
  abstract  = {Speech is a complex signal produced by a highly constrained articulation machinery. Neuro and psycholinguistic theories assert that speech can be decomposed into molecules of structured atoms. Although characterization of the atoms is controversial, the experiments support the notion of invariant speech codes governing speech production and perception. We exploit deep neural network (DNN) invariant representation learning for probabilistic characterization of the phone attributes defined in terms of the phonological classes and known as the smallest-size perceptual categories. We cast speech perception as a channel for phoneme information transmission via the phone attributes. Structured sparse codes are identified from the phonological probabilities for natural speech pronunciation. We exploit the sparse codes in information transmission analysis for assessment of phoneme pronunciation. The linguists define a single binary phonological code per phoneme. In contrast, probabilistic estimation of the phonological classes enables us to capture large variation in structures of speech pronunciation. Hence, speech assessment may not be confined to the single expert knowledge based mapping between phoneme and phonological classes and it may be extended to multiple data-driven mappings observed in natural speech.},
  pdf       = {https://publications.idiap.ch/attachments/papers/2017/Asaei_SPARS_2017.pdf},
}