BibTeX record journals/corr/abs-2104-06139

download as .bib file

@comment{arXiv preprint 2104.06139, record exported from dblp.
  Acronyms in the title are brace-protected so that styles which
  sentence-case titles keep their capitalisation.}
@article{DBLP:journals/corr/abs-2104-06139,
  author    = {Xu, Chao and
               Xie, Yiping and
               Wang, Xijun and
               Yang, Howard H. and
               Niyato, Dusit and
               Quek, Tony Q. S.},
  title     = {Optimizing the Long-Term Average Reward for Continuing {MDPs}: {A} Technical
               Report},
  journal   = {CoRR},
  volume    = {abs/2104.06139},
  year      = {2021},
  url       = {https://arxiv.org/abs/2104.06139},
  archivePrefix = {arXiv},
  eprint    = {2104.06139},
  timestamp = {Fri, 14 May 2021 08:28:36 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/abs-2104-06139.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics