BibTeX record journals/corr/abs-2002-02829

download as .bib file

% arXiv preprint 2002.02829; record exported from dblp (see biburl/bibsource).
% The acronym in the title is brace-protected so sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2002-02829,
  author       = {Hou, Zhimin and
                  Zhang, Kuangen and
                  Wan, Yi and
                  Li, Dongyu and
                  Fu, Chenglong and
                  Yu, Haoyong},
  title        = {Off-policy Maximum Entropy Reinforcement Learning: Soft Actor-Critic
                  with Advantage Weighted Mixture Policy ({SAC-AWMP})},
  journal      = {CoRR},
  volume       = {abs/2002.02829},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02829},
  eprinttype   = {arXiv},
  eprint       = {2002.02829},
  timestamp    = {Sat, 23 Jan 2021 01:12:59 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02829.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics