%Aigaion2 BibTeX export from Idiap Publications
%Wednesday 20 November 2024 06:40:42 PM

% Conference paper record. Cleaned up after export:
%   - month uses the standard unquoted macro (sep) instead of a braced numeral
%   - export residue and a hyphenation artifact removed from the abstract
%   - "~" before bit-rates written as $\sim$ (a bare ~ is a non-breaking space in LaTeX)
%   - acronym in the title brace-protected against style recasing
@inproceedings{Motlicek_TSD2008_2008,
  author    = {Motlicek, Petr and Ganapathy, Sriram and Hermansky, Hynek and Garudadri, Harinath and Athineos, Marios},
  title     = {Perceptually motivated Sub-band Decomposition for {FDLP} Audio Coding},
  booktitle = {Text, Speech and Dialogue},
  series    = {Series of Lecture Notes in Artificial Intelligence (LNAI)},
  volume    = {5246},
  publisher = {Springer-Verlag Berlin, Heidelberg},
  location  = {Brno, Czech Republic},
  year      = {2008},
  month     = sep,
  isbn      = {978-3-540-87390-7},
  keywords  = {Audio Coding, Frequency Domain Linear Prediction (FDLP), speech coding},
  projects  = {Idiap},
  abstract  = {This paper describes employment of non-uniform QMF decomposition to increase the efficiency of a generic wide-band audio coding system based on Frequency Domain Linear Prediction (FDLP). The base line FDLP codec, operating at high bit-rates ($\sim$136 kbps), exploits a uniform QMF decomposition into 64 sub-bands followed by sub-band processing based on FDLP. Here, we propose a non-uniform QMF decomposition into 32 frequency sub-bands obtained by merging 64 uniform QMF bands. The merging operation is performed in such a way that bandwidths of the resulting critically sampled sub-bands emulate the characteristics of the critical band filters in the human auditory system. Such frequency decomposition, when employed in the FDLP audio codec, results in a bit-rate reduction of 40\% over the base line. We also describe the complete audio codec, which provides high-fidelity audio compression at $\sim$66 kbps. In subjective listening tests, the FDLP codec outperforms MPEG-1 Layer 3 (MP3) and achieves similar qualities as MPEG-4 HE-AAC codec.},
  pdf       = {https://publications.idiap.ch/attachments/papers/2008/Motlicek_TSD2008_2008.pdf},
}