%Aigaion2 BibTeX export from Idiap Publications
%Monday 29 April 2024 03:42:43 PM

% Conference paper presented at the 2004 SAPA workshop.
% The companion Idiap research report is linked through the non-inheriting
% xref field rather than crossref: a crossref to a tech report makes classic
% BibTeX styles print "In [report]" instead of the booktitle and copies the
% report-only fields (type, number, institution) into this entry.
% Only the acronym SAPA is brace-protected; title casing is left to the style.
@INPROCEEDINGS{lathoud04b,
         author = {Lathoud, Guillaume and McCowan, Iain A.},
       projects = {Idiap},
          month = oct,
          title = {A Sector-Based Approach for Localization of Multiple Speakers with Microphone Arrays},
      booktitle = {Proceedings of the 2004 {SAPA} Workshop},
           year = {2004},
        address = {Jeju Island, Korea},
           note = {IDIAP-RR 04-15},
           xref = {lathoud-rr-04-15},
       abstract = {Microphone arrays are useful in meeting rooms, where speech needs to be acquired and segmented. For example, automatic speech segmentation allows enhanced browsing experience, and facilitates automatic analysis of large amounts of data. Spontaneous multi-party speech includes many overlaps between speakers; moreover other audio sources such as laptops and projectors can be active. For these reasons, locating multiple wideband sources in a reasonable amount of time is highly desirable. In existing multisource localization approaches, search initialization is very often an issue left open. We propose here a methodology for estimating speech activity in a given sector of the space rather than at a particular point. In experiments on more than one hour of speech from real meeting room multisource recordings, we show that the sector-based approach greatly reduces the search space. At the same time, it achieves effective localization of multiple concurrent speakers.},
            pdf = {https://publications.idiap.ch/attachments/papers/2004/lathoud04b.pdf},
     postscript = {ftp://ftp.idiap.ch/pub/papers/2004/lathoud04b.ps.gz},
        ipdinar = {2004},
  ipdmembership = {speech},
}



% Cross-referenced publications:
% Idiap research report version of the SAPA 2004 workshop paper.
% Standard styles print the type followed by the number, so the number holds
% only the report identifier (15-2004) and the series label lives in type;
% together they render as "Idiap-RR 15-2004".
% The title carries no brace protection: it contains no acronyms or proper
% nouns, so casing is left to the bibliography style.
@TECHREPORT{lathoud-rr-04-15,
         author = {Lathoud, Guillaume and McCowan, Iain A.},
       projects = {Idiap},
          title = {A Sector-Based Approach for Localization of Multiple Speakers with Microphone Arrays},
           type = {Idiap-RR},
         number = {15-2004},
           year = {2004},
    institution = {IDIAP},
        address = {Martigny, Switzerland},
           note = {Published in ``Proceedings of the 2004 SAPA Workshop''},
       abstract = {Microphone arrays are useful in meeting rooms, where speech needs to be acquired and segmented. For example, automatic speech segmentation allows enhanced browsing experience, and facilitates automatic analysis of large amounts of data. Spontaneous multi-party speech includes many overlaps between speakers; moreover other audio sources such as laptops and projectors can be active. For these reasons, locating multiple wideband sources in a reasonable amount of time is highly desirable. In existing multisource localization approaches, search initialization is very often an issue left open. We propose here a methodology for estimating speech activity in a given sector of the space rather than at a particular point. In experiments on more than one hour of speech from real meeting room multisource recordings, we show that the sector-based approach greatly reduces the search space. At the same time, it achieves effective localization of multiple concurrent speakers.},
            pdf = {https://publications.idiap.ch/attachments/reports/2004/rr-04-15.pdf},
     postscript = {ftp://ftp.idiap.ch/pub/reports/2004/rr-04-15.ps.gz},
        ipdinar = {2004},
  ipdmembership = {speech},
       language = {English},
}