BibTeX record journals/tai/PilarskiPV22

download as .bib file

% Journal article record (dblp export). In the title, {Bernoulli} (proper noun)
% and {PARDI} (acronym) are brace-protected as whole words so that styles which
% sentence-case titles keep their capitalisation. The timestamp, biburl and
% bibsource fields are dblp provenance metadata kept for traceability.
@article{DBLP:journals/tai/PilarskiPV22,
  author       = {Pilarski, Sebastian and
                  Pilarski, Slawomir and
                  Varr{\'{o}}, D{\'{a}}niel},
  title        = {Delayed Reward {Bernoulli} Bandits: Optimal Policy and Predictive Meta-Algorithm
                  {PARDI}},
  journal      = {{IEEE} Trans. Artif. Intell.},
  volume       = {3},
  number       = {2},
  pages        = {152--163},
  year         = {2022},
  url          = {https://doi.org/10.1109/TAI.2021.3117743},
  doi          = {10.1109/TAI.2021.3117743},
  timestamp    = {Thu, 27 Jul 2023 08:18:58 +0200},
  biburl       = {https://dblp.org/rec/journals/tai/PilarskiPV22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}