<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns="http://www.loc.gov/MARC21/slim">
	<record>
		<datafield tag="980" ind1=" " ind2=" ">
			<subfield code="a">CONF</subfield>
		</datafield>
		<datafield tag="970" ind1=" " ind2=" ">
			<subfield code="a">Friedland_ACMMM_2009/IDIAP</subfield>
		</datafield>
		<datafield tag="245" ind1=" " ind2=" ">
			<subfield code="a">Visual Speaker Localization Aided by Acoustic Models</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Friedland, Gerald</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Yeo, Chuohao</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Hung, Hayley</subfield>
		</datafield>
		<datafield tag="711" ind1="2" ind2=" ">
			<subfield code="a">ACM Multimedia</subfield>
		</datafield>
		<datafield tag="260" ind1=" " ind2=" ">
			<subfield code="c">2009</subfield>
		</datafield>
		<datafield tag="520" ind1=" " ind2=" ">
			<subfield code="a">The following paper presents a novel audio-visual approach
for unsupervised speaker locationing. Using recordings from
a single, low-resolution room overview camera and a single
far-field microphone, a state-of-the-art audio-only speaker
localization system (traditionally called speaker diarization)
is extended so that both acoustic and visual models are estimated
as part of a joint unsupervised optimization problem.
The speaker diarization system first automatically determines
the number of speakers and estimates “who spoke
when”, then, in a second step, the visual models are used to
infer the location of the speakers in the video. The experiments
were performed on real-world meetings using 4.5 hours
of the publicly available AMI meeting corpus. The proposed
system is able to exploit audio-visual integration to
not only improve the accuracy of a state-of-the-art (audio-only)
speaker diarization, but also adds visual speaker locationing
at little incremental engineering and computation
costs.</subfield>
		</datafield>
	</record>
</collection>