%Aigaion2 BibTeX export from Idiap Publications
%Saturday 21 December 2024 06:01:28 PM

% Conference paper. A technical report with the same title and authors exists
% in this file under the key Imseng_Idiap-RR-26-2009. It is linked through
% `xref` (reference without field inheritance) instead of `crossref`, so that
% report-only fields (type, number, institution, address) are not copied into
% this conference entry. `month` uses the standard three-letter macro and
% `pages` uses the `--` range form so that styles can format both.
@INPROCEEDINGS{Imseng_ASRU_2009,
         author = {Imseng, David and Friedland, Gerald},
       projects = {Idiap, AMIDA, IM2},
          month = dec,
          title = {Robust Speaker Diarization for Short Speech Recordings},
      booktitle = {Proceedings of the {IEEE} Workshop on Automatic Speech Recognition and Understanding},
           year = {2009},
          pages = {432--437},
       location = {Merano, Italy},
           xref = {Imseng_Idiap-RR-26-2009},
       abstract = {We investigate a state-of-the-art Speaker Diarization system regarding its behavior on meetings that are much shorter (from 500 seconds down to 100 seconds) than those typically analyzed in Speaker Diarization benchmarks. First, the problems inherent to this task are analyzed. Then, we propose an approach that consists of a novel initialization parameter estimation method for typical state-of-the-art diarization approaches. The estimation method balances the relationship between the optimal value of the duration of speech data per Gaussian and the duration of the speech data, which is verified experimentally for the first time in this article. As a result, the Diarization Error Rate for short meetings extracted from the 2006, 2007, and 2009 NIST RT evaluation data is decreased by up to 50\% relative.},
            pdf = {https://publications.idiap.ch/attachments/papers/2009/Imseng_ASRU_2009.pdf}
}



% Cross-referenced publications:
% Idiap research report (Idiap-RR-26-2009). The entry Imseng_ASRU_2009 in this
% file has the same title and authors and refers to this key.
% `month` uses the standard three-letter macro so that styles can format it.
@TECHREPORT{Imseng_Idiap-RR-26-2009,
         author = {Imseng, David and Friedland, Gerald},
       projects = {Idiap, AMIDA, IM2},
          month = sep,
          title = {Robust Speaker Diarization for Short Speech Recordings},
           type = {Idiap-RR},
         number = {Idiap-RR-26-2009},
           year = {2009},
    institution = {Idiap},
        address = {PO Box 592 CH - 1920 Martigny},
       abstract = {We investigate a state-of-the-art Speaker Diarization system regarding its behavior on meetings that are much shorter (from 500 seconds down to 100 seconds) than those typically analyzed in Speaker Diarization benchmarks. First, the problems inherent to this task are analyzed. Then, we propose an approach that consists of a novel initialization parameter estimation method for typical state-of-the-art diarization approaches. The estimation method balances the relationship between the optimal value of the duration of speech data per Gaussian and the duration of the speech data, which is verified experimentally for the first time in this article. As a result, the Diarization Error Rate for short meetings extracted from the 2006, 2007, and 2009 NIST RT evaluation data is decreased by up to 50\% relative.},
            pdf = {https://publications.idiap.ch/attachments/reports/2009/Imseng_Idiap-RR-26-2009.pdf}
}