%Aigaion2 BibTeX export from Idiap Publications
%Friday 05 December 2025 03:44:05 PM
% Idiap research report Idiap-RR-72-2004 (Dimitrakakis and Bengio, 2004).
@techreport{dimitrak-bengio_04-72,
  author        = {Dimitrakakis, Christos and Bengio, Samy},
  title         = {Estimates of Parameter Distributions for Optimal Action Selection},
  type          = {Idiap-RR},
  number        = {Idiap-RR-72-2004},
  institution   = {IDIAP},
  year          = {2004},
  abstract      = {We present a general method for maintaining estimates of the distribution of parameters in arbitrary models. This is then applied to the estimation of probability distribution over actions in value-based reinforcement learning. While this approach is similar to other techniques that maintain a confidence measure for action-values, it nevertheless offers a new insight into current techniques and reveals potential avenues of further research.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2004/rr-04-72.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2004/rr-04-72.ps.gz},
  projects      = {Idiap},
  ipdmembership = {learning},
}