BibTeX record journals/corr/abs-2205-10047

download as .bib file

% arXiv e-print 2205.10047; record exported from the dblp computer science bibliography.
@article{DBLP:journals/corr/abs-2205-10047,
  author     = {Chen, Xing and
                Diao, Dongcui and
                Chen, Hechang and
                Yao, Hengshuai and
                Yang, Jielong and
                Piao, Haiyin and
                Sun, Zhixiao and
                Jiang, Bei and
                Chang, Yi},
  title      = {Sigmoidally Preconditioned Off-policy Learning:
                a new exploration method for reinforcement learning},
  journal    = {CoRR},
  volume     = {abs/2205.10047},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2205.10047},
  doi        = {10.48550/ARXIV.2205.10047},
  url        = {https://doi.org/10.48550/arXiv.2205.10047},
  timestamp  = {Tue, 18 Oct 2022 14:07:19 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-10047.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}