%Aigaion2 BibTeX export from Idiap Publications
%Thursday 26 December 2024 05:11:13 PM

% Idiap research report entry. The projects, pdf, postscript and ipdmembership
% fields are non-standard export metadata; unknown fields are ignored by styles.
% NOTE(review): type and number both carry the "Idiap-RR" prefix, so standard
% styles may print it twice -- confirm against the target style before changing.
@techreport{dimitrak-bengio_04-72,
  author        = {Dimitrakakis, Christos and Bengio, Samy},
  title         = {Estimates of Parameter Distributions for Optimal Action Selection},
  type          = {Idiap-RR},
  number        = {Idiap-RR-72-2004},
  institution   = {IDIAP},
  year          = {2004},
  abstract      = {We present a general method for maintaining estimates of the distribution of parameters in arbitrary models. This is then applied to the estimation of probability distribution over actions in value-based reinforcement learning. While this approach is similar to other techniques that maintain a confidence measure for action-values, it nevertheless offers a new insight into current techniques and reveals potential avenues of further research.},
  pdf           = {https://publications.idiap.ch/attachments/reports/2004/rr-04-72.pdf},
  postscript    = {ftp://ftp.idiap.ch/pub/reports/2004/rr-04-72.ps.gz},
  projects      = {Idiap},
  ipdmembership = {learning},
}