%Aigaion2 BibTeX export from Idiap Publications
%Thursday 26 December 2024 05:11:13 PM

% Idiap research report Idiap-RR-72-2004 by Dimitrakakis and Bengio (2004).
% The pdf, postscript, projects and ipdmembership fields are not standard
% BibTeX fields; standard styles ignore unknown fields.
@techreport{dimitrak-bengio_04-72,
  author        = {Dimitrakakis, Christos and Bengio, Samy},
  projects      = {Idiap},
  title         = {Estimates of Parameter Distributions for Optimal Action Selection},
  type          = {Idiap-RR},
  number        = {Idiap-RR-72-2004},
  year          = {2004},
  institution   = {IDIAP},
  abstract      = {We present a general method for maintaining estimates of the distribution of parameters in arbitrary models. This is then applied to the estimation of probability distribution over actions in value-based reinforcement learning. While this approach is similar to other techniques that maintain a confidence measure for action-values, it nevertheless offers a new insight into current techniques and reveals potential avenues of further research.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2004/rr-04-72.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2004/rr-04-72.ps.gz},
  ipdmembership = {learning},
}