<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns="http://www.loc.gov/MARC21/slim">
	<record>
		<datafield tag="980" ind1=" " ind2=" ">
			<subfield code="a">REPORT</subfield>
		</datafield>
		<datafield tag="970" ind1=" " ind2=" ">
			<subfield code="a">Pinto_Idiap-RR-39-2010/IDIAP</subfield>
		</datafield>
		<datafield tag="245" ind1=" " ind2=" ">
			<subfield code="a">Hierarchical Tandem Features for ASR in Mandarin</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Pinto, Joel Praveen</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Magimai-Doss, Mathew</subfield>
		</datafield>
		<datafield tag="700" ind1=" " ind2=" ">
			<subfield code="a">Bourlard, Hervé</subfield>
		</datafield>
		<datafield tag="856" ind1="4" ind2="0">
			<subfield code="i">EXTERNAL</subfield>
			<subfield code="u">http://publications.idiap.ch/attachments/reports/2010/Pinto_Idiap-RR-39-2010.pdf</subfield>
			<subfield code="x">PUBLIC</subfield>
		</datafield>
		<datafield tag="088" ind1=" " ind2=" ">
			<subfield code="a">Idiap-RR-39-2010</subfield>
		</datafield>
		<datafield tag="260" ind1=" " ind2=" ">
			<subfield code="c">2010</subfield>
			<subfield code="b">Idiap</subfield>
		</datafield>
		<datafield tag="771" ind1="2" ind2=" ">
			<subfield code="d">November 2010</subfield>
		</datafield>
		<datafield tag="520" ind1=" " ind2=" ">
			<subfield code="a">We apply multilayer perceptron (MLP) based hierarchical Tandem
features to large vocabulary continuous speech recognition in Mandarin.
Hierarchical Tandem features are estimated using a cascade
of two MLP classifiers which are trained independently. The first
classifier is trained on perceptual linear predictive coefficients with
a 90 ms temporal context. The second classifier is trained using the
phonetic class conditional probabilities estimated by the first MLP,
but with a relatively longer temporal context of about 150 ms. Experiments
on the Mandarin DARPA GALE eval06 dataset show significant
reduction (about 7.6% relative) in character error rates by using
hierarchical Tandem features over conventional Tandem features.</subfield>
		</datafield>
	</record>
</collection>