%Aigaion2 BibTeX export from Idiap Publications
%Friday 05 December 2025 03:44:05 PM

% Idiap research report Idiap-RR-72-2004 (Dimitrakakis and Bengio).
% Fields are grouped as: bibliographic data, abstract, attachments,
% then database-internal metadata (projects, ipdmembership).
@techreport{dimitrak-bengio_04-72,
  author        = {Dimitrakakis, Christos and Bengio, Samy},
  title         = {Estimates of Parameter Distributions for Optimal Action Selection},
  type          = {Idiap-RR},
  number        = {Idiap-RR-72-2004},
  institution   = {IDIAP},
  year          = {2004},
  abstract      = {We present a general method for maintaining estimates of the distribution of parameters in arbitrary models. This is then applied to the estimation of probability distribution over actions in value-based reinforcement learning. While this approach is similar to other techniques that maintain a confidence measure for action-values, it nevertheless offers a new insight into current techniques and reveals potential avenues of further research.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2004/rr-04-72.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2004/rr-04-72.ps.gz},
  projects      = {Idiap},
  ipdmembership = {learning},
}