<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns="http://www.loc.gov/MARC21/slim">
	<record>
		<datafield tag="980" ind1=" " ind2=" ">
			<subfield code="a">REPORT</subfield>
		</datafield>
		<datafield tag="970" ind1=" " ind2=" ">
			<subfield code="a">Motlicek_Idiap-RR-20-2012/IDIAP</subfield>
		</datafield>
		<datafield tag="245" ind1=" " ind2=" ">
			<subfield code="a">Application of Subspace Gaussian Mixture Models in Contrastive Acoustic Scenarios</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Motlicek, Petr</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Garner, Philip N.</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Imseng, David</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Valente, Fabio</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">acoustic modeling</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">Automatic Speech Recognition</subfield>
		</datafield>
		<datafield tag="653" ind1="1" ind2=" ">
			<subfield code="a">Subs-ace Gaussian Mixture Models</subfield>
		</datafield>
		<datafield tag="856" ind1="4" ind2="0">
			<subfield code="i">EXTERNAL</subfield>
			<subfield code="u">http://publications.idiap.ch/attachments/reports/2012/Motlicek_Idiap-RR-20-2012.pdf</subfield>
			<subfield code="x">PUBLIC</subfield>
		</datafield>
		<datafield tag="088" ind1=" " ind2=" ">
			<subfield code="a">Idiap-RR-20-2012</subfield>
		</datafield>
		<datafield tag="260" ind1=" " ind2=" ">
			<subfield code="c">2012</subfield>
			<subfield code="b">Idiap</subfield>
			<subfield code="a">Rue Marconi 19, Martigny, Switzerland</subfield>
		</datafield>
		<datafield tag="771" ind1="2" ind2=" ">
			<subfield code="d">July 2012</subfield>
		</datafield>
		<datafield tag="520" ind1=" " ind2=" ">
			<subfield code="a">This paper describes experimental results of applying Subspace
Gaussian Mixture Models (SGMMs) in two completely diverse
acoustic scenarios: (a) for Large Vocabulary Continuous
Speech Recognition (LVCSR) task over (well-resourced)
English meeting data and, (b) for acoustic modeling of underresourced
Afrikaans telephone data. In both cases, the performance
of SGMM models is compared with a conventional
context-dependent HMM/GMM approach exploiting the same
kind of information available during the training. LVCSR
systems are evaluated on standard NIST Rich Transcription
dataset. For under-resourced Afrikaans, SGMM and
HMM/GMM acoustic systems are additionally compared to
KL-HMM and multilingual Tandem techniques boosted using
supplemental out-of-domain data. Experimental results clearly
show that the SGMMapproach (having considerably less model
parameters) outperforms conventional HMM/GMM system in
both scenarios and for all examined training conditions. In case
of under-resourced scenario, the SGMM trained only using indomain
data is superior to other tested approaches boosted by
data from other domain.</subfield>
		</datafield>
	</record>
</collection>