%Aigaion2 BibTeX export from Idiap Publications
%Thursday 21 November 2024 12:57:25 PM

% Idiap research report Idiap-RR-14-2011.
% `projects` and `pdf` are non-standard fields carried over from the export;
% standard styles ignore them.
@techreport{Parthasarathi_Idiap-RR-14-2011,
  author      = {Parthasarathi, Sree Hari Krishnan and Bourlard, Herv{\'{e}} and Gatica-Perez, Daniel},
  title       = {{LP} Residual Features for Robust, Privacy-Sensitive Speaker Diarization},
  type        = {Idiap-RR},
  number      = {Idiap-RR-14-2011},
  institution = {Idiap},
  month       = may,
  year        = {2011},
  projects    = {Idiap, SNSF-MULTI},
  abstract    = {We present a comprehensive study of linear prediction residual for speaker diarization on single and multiple distant microphone conditions in privacy-sensitive settings, a requirement to analyze a wide range of spontaneous conversations. Two representations of the residual are compared, namely real-cepstrum and MFCC, with the latter performing better. Experiments on RT06eval show that residual with subband information from 2.5 kHz to 3.5 kHz and spectral slope yields a performance close to traditional MFCC features. As a way to objectively evaluate privacy in terms of linguistic information, we perform phoneme recognition. Residual features yield low phoneme accuracies compared to traditional MFCC features.},
  pdf         = {https://publications.idiap.ch/attachments/reports/2011/Parthasarathi_Idiap-RR-14-2011.pdf},
}