BibTeX record conf/uai/WeaverT01

download as .bib file

@comment{
  Conference paper record exported from DBLP (see the biburl and bibsource
  fields of the entry below).
  Person names are stored in "Last, First" form so that name parsing does
  not depend on word order or capitalisation heuristics.
  The url value keeps LaTeX escapes (backslash before ampersand and
  underscore) as needed by classic BibTeX styles; if the toolchain treats
  url as verbatim (biblatex/Biber), those backslashes should be removed.
  timestamp, biburl and bibsource are DBLP bookkeeping fields that standard
  styles ignore.
}
@inproceedings{DBLP:conf/uai/WeaverT01,
  author       = {Weaver, Lex and
                  Tao, Nigel},
  editor       = {Breese, Jack S. and
                  Koller, Daphne},
  title        = {The Optimal Reward Baseline for Gradient-Based Reinforcement Learning},
  booktitle    = {{UAI} '01: Proceedings of the 17th Conference in Uncertainty in Artificial
                  Intelligence, University of Washington, Seattle, Washington, USA,
                  August 2-5, 2001},
  pages        = {538--545},
  publisher    = {Morgan Kaufmann},
  year         = {2001},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=141\&proceeding\_id=17},
  timestamp    = {Wed, 03 Feb 2021 11:09:50 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/WeaverT01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics