BibTeX record journals/corr/abs-2404-00978

download as .bib file

@comment{arXiv preprint record taken from the DBLP bibliography (see biburl and bibsource). Author names are written in the unambiguous Last, First form; the eprint, doi and url fields all identify the same arXiv item.}
@article{DBLP:journals/corr/abs-2404-00978,
  author     = {Zhou, Hang and
                Wang, Chenglong and
                Hu, Yimin and
                Xiao, Tong and
                Zhang, Chunliang and
                Zhu, Jingbo},
  title      = {Prior Constraints-based Reward Model Training for Aligning
                Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2404.00978},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2404.00978},
  doi        = {10.48550/ARXIV.2404.00978},
  url        = {https://doi.org/10.48550/arXiv.2404.00978},
  timestamp  = {Wed, 08 May 2024 17:22:41 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-00978.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}