%Aigaion2 BibTeX export from Idiap Publications %Monday 30 December 2024 06:32:08 PM @ARTICLE{cemgil-kappen-barber-2004, author = {Cemgil, A. T. and Kappen, B. and Barber, David}, projects = {Idiap}, title = {{A Generative Model for Music Transcription}}, journal = {{IEEE Transactions on Speech and Audio Processing}}, year = {2004}, note = {Accepted for publication}, crossref = {barber:rr05-89}, abstract = {In this paper we present a graphical model for polyphonic music transcription. Our model, formulated as a Dynamical Bayesian Network, embodies a transparent and computationally tractable approach to this acoustic analysis problem. An advantage of our approach is that it places emphasis on explicitly modelling the sound generation procedure. It provides a clear framework in which both high level (cognitive) prior information on music structure can be coupled with low level (acoustic physical) information in a principled manner to perform the analysis. The model is a special case of the, generally intractable, switching Kalman filter model. Where possible, we derive, exact polynomial time inference procedures, and otherwise efficient approximations. We argue that our generative model based approach is computationally feasible for many music applications and is readily extensible to more general auditory scene analysis scenarios.}, pdf = {https://publications.idiap.ch/attachments/papers/2005/pianoroll_tsap_final.pdf}, postscript = {ftp://ftp.idiap.ch/pub/papers/2005/pianoroll_tsap_final.ps.gz}, ipdmembership={learning}, } crossreferenced publications: @TECHREPORT{barber:rr05-89, author = {Cemgil, A. T. and Kappen, B. and Barber, David}, projects = {Idiap}, title = {{A Generative Model for Music Transcription}}, type = {Idiap-RR}, number = {Idiap-RR-89-2005}, year = {2005}, institution = {IDIAP}, note = {Accepted to IEEE Transactions on Speech and Audio Processing}, abstract = {In this paper we present a graphical model for polyphonic music transcription. Our model, formulated as a Dynamical Bayesian Network, embodies a transparent and computationally tractable approach to this acoustic analysis problem. An advantage of our approach is that it places emphasis on explicitly modelling the sound generation procedure. It provides a clear framework in which both high level (cognitive) prior information on music structure can be coupled with low level (acoustic physical) information in a principled manner to perform the analysis. The model is a special case of the, generally intractable, switching Kalman filter model. Where possible, we derive, exact polynomial time inference procedures, and otherwise efficient approximations. We argue that our generative model based approach is computationally feasible for many music applications and is readily extensible to more general auditory scene analysis scenarios.}, pdf = {https://publications.idiap.ch/attachments/reports/2005/barber-idiap-rr-05-89.pdf}, postscript = {ftp://ftp.idiap.ch/pub/reports/2005/barber-idiap-rr-05-89.ps.gz}, ipdmembership={learning}, }