BibTeX record journals/corr/abs-2010-01404

download as .bib file

% arXiv preprint 2010.01404 (Kato and Nakagawa, 2020); record exported from DBLP.
@article{DBLP:journals/corr/abs-2010-01404,
  author     = {Kato, Masahiro and Nakagawa, Kei},
  title      = {Policy Gradient with Expected Quadratic Utility Maximization:
                {A} New Mean-Variance Approach in Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2010.01404},
  year       = {2020},
  eprint     = {2010.01404},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/2010.01404},
  timestamp  = {Thu, 14 Oct 2021 09:14:18 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-01404.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics