% Aigaion2 BibTeX export from Idiap Publications
% Saturday 21 December 2024 04:40:56 PM

% Conference paper. Fields it does not set itself may be inherited from the
% tech report below through the crossref field.
@inproceedings{Fritsch_ICASSP_2020,
  author    = {Fritsch, Julian and Dubagunta, S. Pavankumar and Magimai.-Doss, Mathew},
  title     = {Estimating The Degree of Sleepiness by Integrating Articulatory Feature Knowledge In Raw Waveform Based {CNNs}},
  booktitle = {International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  year      = {2020},
  month     = may,
  location  = {Barcelona, Spain},
  keywords  = {articulatory features, Convolutional Neural Networks, end-to-end acoustic modeling, Paralinguistic speech processing, sleepiness},
  projects  = {TAPAS},
  crossref  = {Fritsch_Idiap-RR-06-2019},
  abstract  = {Speech-based degree of sleepiness estimation is an emerging research problem. This paper investigates an end-to-end approach, where given raw waveform as input, a convolutional neural network (CNN) estimates at its output the degree of sleepiness. Within this approach, we investigate constraining the first layer processing and integration of speech production knowledge through transfer learning. We evaluate these methods on the continuous sleepiness corpus of the Interspeech 2019 Computational Paralinguistics (ComParE) Challenge and demonstrate that the proposed approach consistently yields competitive systems. In particular, we observe that integration of speech production knowledge aids in improving the performance and yields systems that are complementary.},
  pdf       = {https://publications.idiap.ch/attachments/papers/2020/Fritsch_ICASSP_2020.pdf}
}

% crossreferenced publications:
% This entry is the crossref target of Fritsch_ICASSP_2020 and is kept after
% it, because classic BibTeX requires a cross-referenced entry to follow the
% entries that refer to it.
% NOTE(review): the citation key and the year field say 2019, while the number
% field and the pdf file name say Idiap-RR-06-2020 -- confirm which is correct.
@techreport{Fritsch_Idiap-RR-06-2019,
  author      = {Fritsch, Julian and Dubagunta, S. Pavankumar and Magimai.-Doss, Mathew},
  title       = {Estimating The Degree of Sleepiness by Integrating Articulatory Feature Knowledge In Raw Waveform Based {CNNs}},
  type        = {Idiap-RR},
  number      = {Idiap-RR-06-2020},
  institution = {Idiap},
  year        = {2019},
  month       = feb,
  projects    = {TAPAS},
  abstract    = {Speech-based degree of sleepiness estimation is an emerging research problem. In the literature, this problem has been mainly addressed through modeling of low level of descriptors. This paper investigates an end-to-end approach, where given raw waveform as input, a neural network estimates at its output the degree of sleepiness. Through an investigation on the continuous sleepiness sub-challenge of the INTERSPEECH 2019 Computational Paralinguistics Challenge, we show that the proposed approach consistently yields performance comparable or better than low level descriptor-based, bag-of-audio-words-based and sequence-to-sequence autoencoder feature representation-based regression systems. Furthermore, a confusion matrix analysis on the development set shows that, unlike the best baseline system, the performance of our approach is not centering around a few degrees of sleepiness, but is spread across all the degrees of sleepiness.},
  pdf         = {https://publications.idiap.ch/attachments/reports/2019/Fritsch_Idiap-RR-06-2020.pdf}
}