BibTeX record journals/corr/abs-2206-05357

download as .bib file

% dblp export of arXiv preprint 2206.05357. Authors are stored in the
% `Last, First` form so that name parsing does not depend on case heuristics.
@article{DBLP:journals/corr/abs-2206-05357,
  author       = {Zhou, Ruida and
                  Liu, Tao and
                  Kalathil, Dileep M. and
                  Kumar, P. R. and
                  Tian, Chao},
  title        = {Anchor-Changing Regularized Natural Policy Gradient for Multi-Objective
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2206.05357},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.05357},
  doi          = {10.48550/ARXIV.2206.05357},
  eprinttype   = {arXiv},
  eprint       = {2206.05357},
  timestamp    = {Mon, 20 Jun 2022 12:59:17 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-05357.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}