BibTeX record journals/corr/abs-2006-12620

download as .bib file

% arXiv preprint 2006.12620, record exported from dblp.
% The acronym in the title is brace-protected so that sentence-casing
% bibliography styles keep its capitals; authors use "Last, First" form.
@article{DBLP:journals/corr/abs-2006-12620,
  author       = {Lazic, Nevena and
                  Yin, Dong and
                  Farajtabar, Mehrdad and
                  Levine, Nir and
                  G{\"{o}}r{\"{u}}r, Dilan and
                  Harris, Chris and
                  Schuurmans, Dale},
  title        = {A maximum-entropy approach to off-policy evaluation in average-reward
                  {MDPs}},
  journal      = {CoRR},
  volume       = {abs/2006.12620},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.12620},
  eprinttype   = {arXiv},
  eprint       = {2006.12620},
  timestamp    = {Wed, 01 Jul 2020 15:21:23 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-12620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics