BibTeX record journals/corr/abs-2402-12034

download as .bib file

% arXiv preprint 2402.12034, listed under CoRR; record exported from DBLP.
@article{DBLP:journals/corr/abs-2402-12034,
  author       = {Mambelli, Davide and
                  Bongers, Stephan and
                  Zoeter, Onno and
                  Spaan, Matthijs T. J. and
                  Oliehoek, Frans A.},
  title        = {When Do Off-Policy and On-Policy Policy Gradient Methods Align?},
  journal      = {CoRR},
  volume       = {abs/2402.12034},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.12034},
  doi          = {10.48550/ARXIV.2402.12034},
  eprinttype   = {arXiv},
  eprint       = {2402.12034},
  timestamp    = {Fri, 22 Mar 2024 14:48:14 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-12034.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics