<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns="http://www.loc.gov/MARC21/slim">
	<record>
		<datafield tag="980" ind1=" " ind2=" ">
			<subfield code="a">CONF</subfield>
		</datafield>
		<datafield tag="970" ind1=" " ind2=" ">
			<subfield code="a">Gay_CBMI_2014/IDIAP</subfield>
		</datafield>
		<datafield tag="245" ind1=" " ind2=" ">
			<subfield code="a">Comparison of Two Methods for Unsupervised Person Identification in TV Shows</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Gay, Paul</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Dupuy, Gregor</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Odobez, Jean-Marc</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Meignier, Sylvain</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Deleglise, Paul</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">Content-based multimedia indexing</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">Face diarization</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">person diarization</subfield>
		</datafield>
		<datafield tag="711" ind1="2" ind2=" ">
			<subfield code="a">12th International Workshop on Content-Based Multimedia Indexing</subfield>
		</datafield>
		<datafield tag="260" ind1=" " ind2=" ">
			<subfield code="c">2014</subfield>
		</datafield>
		<datafield tag="520" ind1=" " ind2=" ">
			<subfield code="a">We address the task of identifying people appearing
in TV shows. The target persons are all people whose identity
is said or written, such as journalists and well-known
people like politicians, athletes, celebrities, etc. In our approach,
overlaid names displayed on the images are used to identify the
persons without any use of biometric models for the speakers
and the faces. Two identification methods are evaluated as part
of the REPERE French evaluation campaign. The first one
relies on co-occurrence times between overlay person names and
speaker/face clusters, and rule-based decisions which assign a
name to each monomodal cluster. The second method uses a
Conditional Random Field (CRF) which combines different types
of co-occurrence statistics and pairwise constraints to jointly
identify speakers and faces.</subfield>
		</datafield>
	</record>
</collection>