BibTeX record journals/corr/abs-2102-00030

download as .bib file

@comment{
  arXiv preprint 2102.00030, record exported from DBLP (see biburl/bibsource).
  The acronym in the title is brace-protected so that sentence-casing
  bibliography styles do not lowercase it. Author names use the
  "Last, First" form. The journal/volume pair follows the DBLP convention
  for CoRR records and is kept alongside the eprint fields.
}
@article{DBLP:journals/corr/abs-2102-00030,
  author     = {Lubars, Joseph and
                Winnicki, Anna and
                Livesay, Michael and
                Srikant, R.},
  title      = {Optimistic Policy Iteration for {MDPs} with Acyclic Transient State
                Structure},
  journal    = {CoRR},
  volume     = {abs/2102.00030},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.00030},
  eprinttype = {arXiv},
  eprint     = {2102.00030},
  timestamp  = {Tue, 09 Feb 2021 13:35:56 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-00030.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics