BibTeX record journals/corr/abs-2212-04720

download as .bib file

@comment{arXiv preprint record exported from DBLP; see the bibsource and biburl fields.}
@article{DBLP:journals/corr/abs-2212-04720,
  author       = {Hong, Joey and
                  Kveton, Branislav and
                  Katariya, Sumeet and
                  Zaheer, Manzil and
                  Ghavamzadeh, Mohammad},
  title        = {Multi-Task Off-Policy Learning from Bandit Feedback},
  journal      = {CoRR},
  volume       = {abs/2212.04720},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.04720},
  doi          = {10.48550/ARXIV.2212.04720},
  eprinttype   = {arXiv},
  eprint       = {2212.04720},
  timestamp    = {Mon, 02 Jan 2023 15:09:55 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-04720.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics