%Aigaion2 BibTeX export from Idiap Publications
%Wednesday 20 November 2024 07:50:32 PM
%
% Layout: one entry per block, one field per line. Each entry header starts
% on its own line so that it never shares a line with a percent-prefixed
% comment.
%
% Entry motlicek:mlmi:2007 -- workshop paper. Its note field names the
% companion Idiap research report (IDIAP-RR 07-16), which is the entry
% motlicek:rr07-16 further down. The link to that report is stored in xref
% rather than crossref: the report is not the proceedings volume containing
% this paper, so its type, number and institution fields must not be
% inherited here. The acronym QMF is brace-protected in the title so that
% sentence-casing styles keep it in upper case.

@inproceedings{motlicek:mlmi:2007,
  author        = {Motlicek, Petr and Hermansky, Hynek and Ganapathy, Sriram and Garudadri, Harinath},
  projects      = {Idiap},
  title         = {Frequency Domain Linear Prediction for {QMF} Sub-bands and Applications to Audio Coding},
  booktitle     = {4th Joint Workshop on Multimodal Interaction and Related Machine Learning Algorithms ({MLMI})},
  year          = {2007},
  note          = {IDIAP-RR 07-16},
  xref          = {motlicek:rr07-16},
  abstract      = {This paper proposes an analysis technique for wide-band audio applications based on the predictability of the temporal evolution of Quadrature Mirror Filter (QMF) sub-band signals. The input audio signal is first decomposed into 64 sub-band signals using QMF decomposition. The temporal envelopes in critically sampled QMF sub-bands are approximated using frequency domain linear prediction applied over relatively long time segments (e.g. 1000 ms). Line Spectral Frequency parameters related to autoregressive models are computed and quantized in each frequency sub-band. The sub-band residuals are quantized in the frequency domain using a combination of split Vector Quantization (VQ) (for magnitudes) and uniform scalar quantization (for phases). In the decoder, the sub-band signal is reconstructed using the quantized residual and the corresponding quantized envelope. Finally, application of inverse QMF reconstructs the audio signal. Even with simple quantization techniques and without any sophisticated modules, the proposed audio coder provides encouraging results in objective quality tests. Also, the proposed coder is easily scalable across a wide range of bit-rates.},
  pdf           = {https://publications.idiap.ch/attachments/papers/2007/motlicek-mlmi-2007.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/papers/2007/motlicek-mlmi-2007.ps.gz},
  ipdmembership = {speech},
}

% crossreferenced publications:
%
% Entry motlicek:rr07-16 -- the Idiap research report referenced by the
% workshop paper above. It is kept after that paper in the file.

@techreport{motlicek:rr07-16,
  author        = {Motlicek, Petr and Ganapathy, Sriram and Hermansky, Hynek and Garudadri, Harinath},
  projects      = {Idiap},
  title         = {Scalable Wide-band Audio Codec based on Frequency Domain Linear Prediction},
  type          = {Idiap-RR},
  number        = {Idiap-RR-16-2007},
  year          = {2007},
  institution   = {IDIAP},
  abstract      = {This paper proposes a technique for wide-band audio applications based on the predictability of the temporal evolution of Quadrature Mirror Filter (QMF) sub-band signals. An input audio signal is first decomposed into 64 frequency sub-band signals using QMF decomposition. The temporal envelopes in critically sampled QMF sub-bands are approximated using frequency domain linear prediction applied over relatively long time segments (e.g. $1000$ ms). Line Spectral Frequency parameters related to autoregressive models are computed and quantized in each frequency sub-band. The sub-band residual signals are quantized in the frequency domain using a split Vector Quantization (VQ) technique. In the decoder, the sub-band signal is reconstructed using the quantized residual and the corresponding quantized envelope. Finally, application of inverse QMF reconstructs the audio signal. Even with simple quantization techniques and without any psychoacoustic model, the proposed audio coder provides encouraging results on objective quality tests.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2007/motlicek-idiap-rr-07-16.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2007/motlicek-idiap-rr-07-16.ps.gz},
  ipdmembership = {speech},
}