BibTeX records: Theophane Weber

download as .bib file

% ICLR 2023 conference record; the CoRR record DBLP:journals/corr/abs-2204-04875
% in this file carries the same title.
@inproceedings{DBLP:conf/iclr/KeCWBGRWBMR23,
  author       = {Ke, Nan Rosemary and
                  Chiappa, Silvia and
                  Wang, Jane X. and
                  Bornschein, J{\"{o}}rg and
                  Goyal, Anirudh and
                  Rey, M{\'{e}}lanie and
                  Weber, Theophane and
                  Botvinick, Matthew M. and
                  Mozer, Michael Curtis and
                  Rezende, Danilo Jimenez},
  title        = {Learning to Induce Causal Structure},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=hp\_RwhKDJ5},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/KeCWBGRWBMR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper, PMLR volume 202.
@inproceedings{DBLP:conf/icml/MesnardCSTRWLGV23,
  author       = {Mesnard, Thomas and
                  Chen, Wenqi and
                  Saade, Alaa and
                  Tang, Yunhao and
                  Rowland, Mark and
                  Weber, Theophane and
                  Lyle, Clare and
                  Gruslys, Audrunas and
                  Valko, Michal and
                  Dabney, Will and
                  Ostrovski, Georg and
                  Moulines, Eric and
                  Munos, R{\'{e}}mi},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Quantile Credit Assignment},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {24517--24531},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/mesnard23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/MesnardCSTRWLGV23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper, PMLR volume 202; the CoRR record
% DBLP:journals/corr/abs-2302-04009 in this file carries the same title.
@inproceedings{DBLP:conf/icml/WalkerVLDAWH23,
  author       = {Walker, Jacob C. and
                  V{\'{e}}rtes, Eszter and
                  Li, Yazhe and
                  Dulac{-}Arnold, Gabriel and
                  Anand, Ankesh and
                  Weber, Theophane and
                  Hamrick, Jessica B.},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Investigating the Role of Model-Based Learning in Exploration and
                  Transfer},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {35368--35383},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/walker23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/WalkerVLDAWH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2301.05747 (CoRR).
% {3D} is braced so sentence-casing styles do not turn it into "3d".
@article{DBLP:journals/corr/abs-2301-05747,
  author       = {Moreno, Pol and
                  Kosiorek, Adam R. and
                  Strathmann, Heiko and
                  Zoran, Daniel and
                  Schneider, Ros{\'{a}}lia G. and
                  Winckler, Bj{\"{o}}rn and
                  Markeeva, Larisa and
                  Weber, Th{\'{e}}ophane and
                  Rezende, Danilo J.},
  title        = {Laser: Latent Set Representations for {3D} Generative Modeling},
  journal      = {CoRR},
  volume       = {abs/2301.05747},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.05747},
  doi          = {10.48550/ARXIV.2301.05747},
  eprinttype   = {arXiv},
  eprint       = {2301.05747},
  timestamp    = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-05747.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.04009 (CoRR); the ICML 2023 record
% DBLP:conf/icml/WalkerVLDAWH23 in this file is the same paper.
% Title is stored in Title Case, matching that record; styles can still downcase it.
@article{DBLP:journals/corr/abs-2302-04009,
  author       = {Walker, Jacob C. and
                  V{\'{e}}rtes, Eszter and
                  Li, Yazhe and
                  Dulac{-}Arnold, Gabriel and
                  Anand, Ankesh and
                  Weber, Th{\'{e}}ophane and
                  Hamrick, Jessica B.},
  title        = {Investigating the Role of Model-Based Learning in Exploration and
                  Transfer},
  journal      = {CoRR},
  volume       = {abs/2302.04009},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.04009},
  doi          = {10.48550/ARXIV.2302.04009},
  eprinttype   = {arXiv},
  eprint       = {2302.04009},
  timestamp    = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-04009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.04798 (CoRR).
% {MuZero} is braced so sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-2302-04798,
  author       = {Deac, Andreea and
                  Weber, Th{\'{e}}ophane and
                  Papamakarios, George},
  title        = {Equivariant {MuZero}},
  journal      = {CoRR},
  volume       = {abs/2302.04798},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.04798},
  doi          = {10.48550/ARXIV.2302.04798},
  eprinttype   = {arXiv},
  eprint       = {2302.04798},
  timestamp    = {Mon, 13 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-04798.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2304.05823 (CoRR).
% {DiscoGen} is braced so sentence-casing styles do not render it "Discogen".
@article{DBLP:journals/corr/abs-2304-05823,
  author       = {Ke, Nan Rosemary and
                  Dunn, Sara{-}Jane and
                  Bornschein, J{\"{o}}rg and
                  Chiappa, Silvia and
                  Rey, M{\'{e}}lanie and
                  Lespiau, Jean{-}Baptiste and
                  Cassirer, Albin and
                  Wang, Jane X. and
                  Weber, Theophane and
                  Barrett, David G. T. and
                  Botvinick, Matthew M. and
                  Goyal, Anirudh and
                  Mozer, Michael and
                  Rezende, Danilo J.},
  title        = {{DiscoGen}: Learning to Discover Gene Regulatory Networks},
  journal      = {CoRR},
  volume       = {abs/2304.05823},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.05823},
  doi          = {10.48550/ARXIV.2304.05823},
  eprinttype   = {arXiv},
  eprint       = {2304.05823},
  timestamp    = {Thu, 20 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-05823.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 conference record; the CoRR record DBLP:journals/corr/abs-2111-01587
% in this file is the same paper.
% Title is stored in Title Case, matching that record; styles can still downcase it.
@inproceedings{DBLP:conf/iclr/AnandWLVSOWH22,
  author       = {Anand, Ankesh and
                  Walker, Jacob C. and
                  Li, Yazhe and
                  V{\'{e}}rtes, Eszter and
                  Schrittwieser, Julian and
                  Ozair, Sherjil and
                  Weber, Theophane and
                  Hamrick, Jessica B.},
  title        = {Procedural Generalization by Planning with Self-Supervised World Models},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=FmBegXJToY},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AnandWLVSOWH22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2022 paper, PMLR volume 162; the CoRR record
% DBLP:journals/corr/abs-2202-08417 in this file carries the same title.
@inproceedings{DBLP:conf/icml/GoyalFBWKBGMHKV22,
  author       = {Goyal, Anirudh and
                  Friesen, Abram L. and
                  Banino, Andrea and
                  Weber, Theophane and
                  Ke, Nan Rosemary and
                  Badia, Adri{\`{a}} Puigdom{\`{e}}nech and
                  Guez, Arthur and
                  Mirza, Mehdi and
                  Humphreys, Peter C. and
                  Konyushkova, Ksenia and
                  Valko, Michal and
                  Osindero, Simon and
                  Lillicrap, Timothy P. and
                  Heess, Nicolas and
                  Blundell, Charles},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Retrieval-Augmented Reinforcement Learning},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {7740--7765},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/goyal22a.html},
  timestamp    = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GoyalFBWKBGMHKV22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the CoRR record DBLP:journals/corr/abs-2206-05314 in this
% file carries the same title.
% Editor given names are spelled out (the export had initials only) so that
% styles, not the database, decide on abbreviation.
@inproceedings{DBLP:conf/nips/HumphreysGTSWL22,
  author       = {Humphreys, Peter C. and
                  Guez, Arthur and
                  Tieleman, Olivier and
                  Sifre, Laurent and
                  Weber, Theophane and
                  Lillicrap, Timothy P.},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {Large-Scale Retrieval for Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/7eca17ef54789b0663cab421f2e9dbf5-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/HumphreysGTSWL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.08417 (CoRR); the ICML 2022 record
% DBLP:conf/icml/GoyalFBWKBGMHKV22 in this file carries the same title.
@article{DBLP:journals/corr/abs-2202-08417,
  author       = {Goyal, Anirudh and
                  Friesen, Abram L. and
                  Banino, Andrea and
                  Weber, Theophane and
                  Ke, Nan Rosemary and
                  Badia, Adri{\`{a}} Puigdom{\`{e}}nech and
                  Guez, Arthur and
                  Mirza, Mehdi and
                  Konyushkova, Ksenia and
                  Valko, Michal and
                  Osindero, Simon and
                  Lillicrap, Timothy P. and
                  Heess, Nicolas and
                  Blundell, Charles},
  title        = {Retrieval-Augmented Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2202.08417},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.08417},
  eprinttype   = {arXiv},
  eprint       = {2202.08417},
  timestamp    = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-08417.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.04875 (CoRR); the ICLR 2023 record
% DBLP:conf/iclr/KeCWBGRWBMR23 in this file carries the same title.
@article{DBLP:journals/corr/abs-2204-04875,
  author       = {Ke, Nan Rosemary and
                  Chiappa, Silvia and
                  Wang, Jane and
                  Bornschein, J{\"{o}}rg and
                  Weber, Theophane and
                  Goyal, Anirudh and
                  Botvinick, Matthew M. and
                  Mozer, Michael and
                  Rezende, Danilo Jimenez},
  title        = {Learning to Induce Causal Structure},
  journal      = {CoRR},
  volume       = {abs/2204.04875},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.04875},
  doi          = {10.48550/ARXIV.2204.04875},
  eprinttype   = {arXiv},
  eprint       = {2204.04875},
  timestamp    = {Mon, 11 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-04875.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.05314 (CoRR); the NeurIPS 2022 record
% DBLP:conf/nips/HumphreysGTSWL22 in this file carries the same title.
@article{DBLP:journals/corr/abs-2206-05314,
  author       = {Humphreys, Peter C. and
                  Guez, Arthur and
                  Tieleman, Olivier and
                  Sifre, Laurent and
                  Weber, Th{\'{e}}ophane and
                  Lillicrap, Timothy P.},
  title        = {Large-Scale Retrieval for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2206.05314},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.05314},
  doi          = {10.48550/ARXIV.2206.05314},
  eprinttype   = {arXiv},
  eprint       = {2206.05314},
  timestamp    = {Mon, 20 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-05314.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 conference record; the CoRR record DBLP:journals/corr/abs-2011-04021
% in this file carries the same title.
% Title is stored in Title Case; styles can downcase it but cannot restore capitals.
@inproceedings{DBLP:conf/iclr/HamrickFBGVWABV21,
  author       = {Hamrick, Jessica B. and
                  Friesen, Abram L. and
                  Behbahani, Feryal M. P. and
                  Guez, Arthur and
                  Viola, Fabio and
                  Witherspoon, Sims and
                  Anthony, Thomas and
                  Buesing, Lars Holger and
                  Velickovic, Petar and
                  Weber, Theophane},
  title        = {On the Role of Planning in Model-Based Deep Reinforcement Learning},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=IrM64DGB21},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/HamrickFBGVWABV21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR volume 139; the CoRR record
% DBLP:journals/corr/abs-2104-06159 in this file carries the same title.
% URL uses https, matching the other proceedings.mlr.press links in this file.
@inproceedings{DBLP:conf/icml/HesselDVGSSWSH21,
  author       = {Hessel, Matteo and
                  Danihelka, Ivo and
                  Viola, Fabio and
                  Guez, Arthur and
                  Schmitt, Simon and
                  Sifre, Laurent and
                  Weber, Theophane and
                  Silver, David and
                  van Hasselt, Hado},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Muesli: Combining Improvements in Policy Optimization},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {4214--4226},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/hessel21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/HesselDVGSSWSH21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR volume 139; the CoRR record
% DBLP:journals/corr/abs-2011-09464 in this file carries the same title.
% URL uses https, matching the other proceedings.mlr.press links in this file.
@inproceedings{DBLP:conf/icml/MesnardWVTSHDSH21,
  author       = {Mesnard, Thomas and
                  Weber, Theophane and
                  Viola, Fabio and
                  Thakoor, Shantanu and
                  Saade, Alaa and
                  Harutyunyan, Anna and
                  Dabney, Will and
                  Stepleton, Thomas S. and
                  Heess, Nicolas and
                  Guez, Arthur and
                  Moulines, Eric and
                  Hutter, Marcus and
                  Buesing, Lars and
                  Munos, R{\'{e}}mi},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Counterfactual Credit Assignment in Model-Free Reinforcement Learning},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {7654--7664},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/mesnard21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/MesnardWVTSHDSH21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.02274 (CoRR).
@article{DBLP:journals/corr/abs-2102-02274,
  author       = {Moreno, Pol and
                  Hughes, Edward and
                  McKee, Kevin R. and
                  Pires, Bernardo {\'{A}}vila and
                  Weber, Th{\'{e}}ophane},
  title        = {Neural Recursive Belief States in Multi-Agent Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2102.02274},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.02274},
  eprinttype   = {arXiv},
  eprint       = {2102.02274},
  timestamp    = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-02274.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.12425 (CoRR).
@article{DBLP:journals/corr/abs-2102-12425,
  author       = {Raposo, David and
                  Ritter, Samuel and
                  Santoro, Adam and
                  Wayne, Greg and
                  Weber, Theophane and
                  Botvinick, Matt M. and
                  van Hasselt, Hado and
                  Song, H. Francis},
  title        = {Synthetic Returns for Long-Term Credit Assignment},
  journal      = {CoRR},
  volume       = {abs/2102.12425},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.12425},
  eprinttype   = {arXiv},
  eprint       = {2102.12425},
  timestamp    = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-12425.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.06159 (CoRR); the ICML 2021 record
% DBLP:conf/icml/HesselDVGSSWSH21 in this file carries the same title.
@article{DBLP:journals/corr/abs-2104-06159,
  author       = {Hessel, Matteo and
                  Danihelka, Ivo and
                  Viola, Fabio and
                  Guez, Arthur and
                  Schmitt, Simon and
                  Sifre, Laurent and
                  Weber, Theophane and
                  Silver, David and
                  van Hasselt, Hado},
  title        = {Muesli: Combining Improvements in Policy Optimization},
  journal      = {CoRR},
  volume       = {abs/2104.06159},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.06159},
  eprinttype   = {arXiv},
  eprint       = {2104.06159},
  timestamp    = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-06159.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2111.01587 (CoRR); the ICLR 2022 record
% DBLP:conf/iclr/AnandWLVSOWH22 in this file is the same paper.
@article{DBLP:journals/corr/abs-2111-01587,
  author       = {Anand, Ankesh and
                  Walker, Jacob C. and
                  Li, Yazhe and
                  V{\'{e}}rtes, Eszter and
                  Schrittwieser, Julian and
                  Ozair, Sherjil and
                  Weber, Th{\'{e}}ophane and
                  Hamrick, Jessica B.},
  title        = {Procedural Generalization by Planning with Self-Supervised World Models},
  journal      = {CoRR},
  volume       = {abs/2111.01587},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.01587},
  eprinttype   = {arXiv},
  eprint       = {2111.01587},
  timestamp    = {Thu, 18 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-01587.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2020 paper, PMLR volume 108.
% {Monte Carlo} is braced so sentence-casing styles keep the proper noun capitalised.
% URL uses https, matching the other proceedings.mlr.press links in this file.
@inproceedings{DBLP:conf/aistats/BuesingHW20,
  author       = {Buesing, Lars and
                  Heess, Nicolas and
                  Weber, Theophane},
  editor       = {Chiappa, Silvia and
                  Calandra, Roberto},
  title        = {Approximate Inference in Discrete Distributions with {Monte Carlo} Tree
                  Search and Value Functions},
  booktitle    = {The 23rd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series       = {Proceedings of Machine Learning Research},
  volume       = {108},
  pages        = {624--634},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v108/buesing20a.html},
  timestamp    = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/BuesingHW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 workshop paper, PMLR volume 137; the CoRR record
% DBLP:journals/corr/abs-2012-07969 in this file carries the same title.
% The workshop name uses TeX quote ligatures instead of ASCII double quotes, which
% typeset as two closing quotes and clash with babel shorthands.
% Title is stored in Title Case; styles can downcase it but cannot restore capitals.
@inproceedings{DBLP:conf/icbinb/RoscaWGM20,
  author       = {Rosca, Mihaela and
                  Weber, Theophane and
                  Gretton, Arthur and
                  Mohamed, Shakir},
  editor       = {Forde, Jessica Zosa and
                  Ruiz, Francisco J. R. and
                  Pradier, Melanie F. and
                  Schein, Aaron},
  title        = {A Case for New Neural Network Smoothness Constraints},
  booktitle    = {``I Can't Believe It's Not Better!'' at NeurIPS Workshops, Virtual,
                  December 12, 2020},
  series       = {Proceedings of Machine Learning Research},
  volume       = {137},
  pages        = {21--32},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v137/rosca20a.html},
  timestamp    = {Thu, 14 Jul 2022 17:31:05 +0200},
  biburl       = {https://dblp.org/rec/conf/icbinb/RoscaWGM20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference record.
% {Q-Learning} is braced so sentence-casing styles keep the capital Q.
@inproceedings{DBLP:conf/iclr/HamrickBSPWBB20,
  author       = {Hamrick, Jessica B. and
                  Bapst, Victor and
                  Sanchez{-}Gonzalez, Alvaro and
                  Pfaff, Tobias and
                  Weber, Theophane and
                  Buesing, Lars and
                  Battaglia, Peter W.},
  title        = {Combining {Q-Learning} and Search with Amortized Value Estimates},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=SkeAaJrKDS},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/HamrickBSPWBB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; the CoRR record DBLP:journals/corr/abs-2002-08329 in this
% file carries the same title.
@inproceedings{DBLP:conf/nips/GuezVWBKPSH20,
  author       = {Guez, Arthur and
                  Viola, Fabio and
                  Weber, Theophane and
                  Buesing, Lars and
                  Kapturowski, Steven and
                  Precup, Doina and
                  Silver, David and
                  Heess, Nicolas},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Value-driven Hindsight Modelling},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/9381fc93ad66f9ec4b2eef71147a6665-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GuezVWBKPSH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.02836 (CoRR).
@article{DBLP:journals/corr/abs-2002-02836,
  author       = {Rezende, Danilo J. and
                  Danihelka, Ivo and
                  Papamakarios, George and
                  Ke, Nan Rosemary and
                  Jiang, Ray and
                  Weber, Theophane and
                  Gregor, Karol and
                  Merzic, Hamza and
                  Viola, Fabio and
                  Wang, Jane and
                  Mitrovic, Jovana and
                  Besse, Frederic and
                  Antonoglou, Ioannis and
                  Buesing, Lars},
  title        = {Causally Correct Partial Models for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2002.02836},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02836},
  eprinttype   = {arXiv},
  eprint       = {2002.02836},
  timestamp    = {Thu, 28 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02836.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.08329 (CoRR); the NeurIPS 2020 record
% DBLP:conf/nips/GuezVWBKPSH20 in this file carries the same title.
@article{DBLP:journals/corr/abs-2002-08329,
  author       = {Guez, Arthur and
                  Viola, Fabio and
                  Weber, Th{\'{e}}ophane and
                  Buesing, Lars and
                  Kapturowski, Steven and
                  Precup, Doina and
                  Silver, David and
                  Heess, Nicolas},
  title        = {Value-driven Hindsight Modelling},
  journal      = {CoRR},
  volume       = {abs/2002.08329},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.08329},
  eprinttype   = {arXiv},
  eprint       = {2002.08329},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-08329.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.11410 (CoRR).
% {Monte Carlo} is braced so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-2004-11410,
  author       = {Parascandolo, Giambattista and
                  Buesing, Lars and
                  Merel, Josh and
                  Hasenclever, Leonard and
                  Aslanides, John and
                  Hamrick, Jessica B. and
                  Heess, Nicolas and
                  Neitz, Alexander and
                  Weber, Theophane},
  title        = {Divide-and-Conquer {Monte Carlo} Tree Search For Goal-Directed Planning},
  journal      = {CoRR},
  volume       = {abs/2004.11410},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.11410},
  eprinttype   = {arXiv},
  eprint       = {2004.11410},
  timestamp    = {Tue, 28 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-11410.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.05524 (CoRR).
@article{DBLP:journals/corr/abs-2009-05524,
  author       = {Mirza, Mehdi and
                  Jaegle, Andrew and
                  Hunt, Jonathan J. and
                  Guez, Arthur and
                  Tunyasuvunakool, Saran and
                  Muldal, Alistair and
                  Weber, Th{\'{e}}ophane and
                  Karkus, P{\'{e}}ter and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Buesing, Lars and
                  Lillicrap, Timothy P. and
                  Heess, Nicolas},
  title        = {Physically Embedded Planning Problems: New Challenges for Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2009.05524},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.05524},
  eprinttype   = {arXiv},
  eprint       = {2009.05524},
  timestamp    = {Thu, 17 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-05524.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.01298 (CoRR).
% {3D} and {Sokoban} are braced so sentence-casing styles do not lowercase them.
@article{DBLP:journals/corr/abs-2010-01298,
  author       = {Karkus, P{\'{e}}ter and
                  Mirza, Mehdi and
                  Guez, Arthur and
                  Jaegle, Andrew and
                  Lillicrap, Timothy P. and
                  Buesing, Lars and
                  Heess, Nicolas and
                  Weber, Theophane},
  title        = {Beyond Tabula-Rasa: a Modular Reinforcement Learning Approach for
                  Physically Embedded {3D} {Sokoban}},
  journal      = {CoRR},
  volume       = {abs/2010.01298},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.01298},
  eprinttype   = {arXiv},
  eprint       = {2010.01298},
  timestamp    = {Mon, 12 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-01298.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.04021 (CoRR); the ICLR 2021 record
% DBLP:conf/iclr/HamrickFBGVWABV21 in this file carries the same title.
% Title is stored in Title Case; styles can downcase it but cannot restore capitals.
@article{DBLP:journals/corr/abs-2011-04021,
  author       = {Hamrick, Jessica B. and
                  Friesen, Abram L. and
                  Behbahani, Feryal M. P. and
                  Guez, Arthur and
                  Viola, Fabio and
                  Witherspoon, Sims and
                  Anthony, Thomas and
                  Buesing, Lars and
                  Velickovic, Petar and
                  Weber, Th{\'{e}}ophane},
  title        = {On the Role of Planning in Model-Based Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2011.04021},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.04021},
  eprinttype   = {arXiv},
  eprint       = {2011.04021},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-04021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.09464 (CoRR); the ICML 2021 record
% DBLP:conf/icml/MesnardWVTSHDSH21 in this file carries the same title.
@article{DBLP:journals/corr/abs-2011-09464,
  author       = {Mesnard, Thomas and
                  Weber, Th{\'{e}}ophane and
                  Viola, Fabio and
                  Thakoor, Shantanu and
                  Saade, Alaa and
                  Harutyunyan, Anna and
                  Dabney, Will and
                  Stepleton, Tom and
                  Heess, Nicolas and
                  Guez, Arthur and
                  Hutter, Marcus and
                  Buesing, Lars and
                  Munos, R{\'{e}}mi},
  title        = {Counterfactual Credit Assignment in Model-Free Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2011.09464},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.09464},
  eprinttype   = {arXiv},
  eprint       = {2011.09464},
  timestamp    = {Wed, 25 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-09464.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2012.07969 (CoRR); the workshop record
% DBLP:conf/icbinb/RoscaWGM20 in this file carries the same title.
% Title is stored in Title Case; styles can downcase it but cannot restore capitals.
@article{DBLP:journals/corr/abs-2012-07969,
  author       = {Rosca, Mihaela and
                  Weber, Theophane and
                  Gretton, Arthur and
                  Mohamed, Shakir},
  title        = {A Case for New Neural Network Smoothness Constraints},
  journal      = {CoRR},
  volume       = {abs/2012.07969},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.07969},
  eprinttype   = {arXiv},
  eprint       = {2012.07969},
  timestamp    = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-07969.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2019 paper, PMLR volume 89.
% URL uses https, matching the other proceedings.mlr.press links in this file.
@inproceedings{DBLP:conf/aistats/WeberHBS19,
  author       = {Weber, Th{\'{e}}ophane and
                  Heess, Nicolas and
                  Buesing, Lars and
                  Silver, David},
  editor       = {Chaudhuri, Kamalika and
                  Sugiyama, Masashi},
  title        = {Credit Assignment Techniques in Stochastic Computation Graphs},
  booktitle    = {The 22nd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series       = {Proceedings of Machine Learning Research},
  volume       = {89},
  pages        = {2650--2660},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v89/weber19a.html},
  timestamp    = {Fri, 07 Jun 2019 09:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/WeberHBS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BuesingWZHRGL19,
  author       = {Buesing, Lars and
                  Weber, Theophane and
                  Zwols, Yori and
                  Heess, Nicolas and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Guez, Arthur and
                  Lespiau, Jean{-}Baptiste},
  title        = {Woulda, Coulda, Shoulda: Counterfactually-Guided Policy Search},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, {USA}, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=BJG0voC9YQ},
  timestamp    = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BuesingWZHRGL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/GregorPBBW19,
  author       = {Gregor, Karol and
                  Papamakarios, George and
                  Besse, Frederic and
                  Buesing, Lars and
                  Weber, Theophane},
  title        = {Temporal Difference Variational Auto-Encoder},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, {USA}, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=S1x4ghC9tQ},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GregorPBBW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GuezMGKRWRSOEWS19,
  author       = {Guez, Arthur and
                  Mirza, Mehdi and
                  Gregor, Karol and
                  Kabra, Rishabh and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Weber, Theophane and
                  Raposo, David and
                  Santoro, Adam and
                  Orseau, Laurent and
                  Eccles, Tom and
                  Wayne, Greg and
                  Silver, David and
                  Lillicrap, Timothy P.},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {An Investigation of Model-Free Planning},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {2464--2473},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/guez19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GuezMGKRWRSOEWS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1901-01761,
  author       = {Weber, Th{\'{e}}ophane and
                  Heess, Nicolas and
                  Buesing, Lars and
                  Silver, David},
  title        = {Credit Assignment Techniques in Stochastic Computation Graphs},
  journal      = {CoRR},
  volume       = {abs/1901.01761},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.01761},
  eprinttype   = {arXiv},
  eprint       = {1901.01761},
  timestamp    = {Thu, 31 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-01761.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1901-03559,
  author       = {Guez, Arthur and
                  Mirza, Mehdi and
                  Gregor, Karol and
                  Kabra, Rishabh and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Weber, Th{\'{e}}ophane and
                  Raposo, David and
                  Santoro, Adam and
                  Orseau, Laurent and
                  Eccles, Tom and
                  Wayne, Greg and
                  Silver, David and
                  Lillicrap, Timothy P.},
  title        = {An investigation of model-free planning},
  journal      = {CoRR},
  volume       = {abs/1901.03559},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.03559},
  eprinttype   = {arXiv},
  eprint       = {1901.03559},
  timestamp    = {Fri, 01 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-03559.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-01007,
  author       = {Mellor, John F. J. and
                  Park, Eunbyung and
                  Ganin, Yaroslav and
                  Babuschkin, Igor and
                  Kulkarni, Tejas and
                  Rosenbaum, Dan and
                  Ballard, Andy and
                  Weber, Theophane and
                  Vinyals, Oriol and
                  Eslami, S. M. Ali},
  title        = {Unsupervised Doodling and Painting with Improved {SPIRAL}},
  journal      = {CoRR},
  volume       = {abs/1910.01007},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.01007},
  eprinttype   = {arXiv},
  eprint       = {1910.01007},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-01007.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-06862,
  author       = {Buesing, Lars and
                  Heess, Nicolas and
                  Weber, Theophane},
  title        = {Approximate Inference in Discrete Distributions with {Monte Carlo} Tree
                  Search and Value Functions},
  journal      = {CoRR},
  volume       = {abs/1910.06862},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.06862},
  eprinttype   = {arXiv},
  eprint       = {1910.06862},
  timestamp    = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-06862.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-02807,
  author       = {Hamrick, Jessica B. and
                  Bapst, Victor and
                  Sanchez{-}Gonzalez, Alvaro and
                  Pfaff, Tobias and
                  Weber, Theophane and
                  Buesing, Lars and
                  Battaglia, Peter W.},
  title        = {Combining {Q}-Learning and Search with Amortized Value Estimates},
  journal      = {CoRR},
  volume       = {abs/1912.02807},
  year         = {2019},
  url          = {https://arxiv.org/abs/1912.02807},
  eprinttype   = {arXiv},
  eprint       = {1912.02807},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-02807.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GuezWASVWMS18,
  author       = {Guez, Arthur and
                  Weber, Theophane and
                  Antonoglou, Ioannis and
                  Simonyan, Karen and
                  Vinyals, Oriol and
                  Wierstra, Daan and
                  Munos, R{\'{e}}mi and
                  Silver, David},
  editor       = {Dy, Jennifer G. and
                  Krause, Andreas},
  title        = {Learning to Search with {MCTSnets}},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10-15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {1817--1826},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {https://proceedings.mlr.press/v80/guez18a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GuezWASVWMS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/OrseauLLW18,
  author       = {Orseau, Laurent and
                  Lelis, Levi and
                  Lattimore, Tor and
                  Weber, Theophane},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Single-Agent Policy Tree Search With Guarantees},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, {NeurIPS} 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {3205--3215},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/52c5189391854c93e8a0e1326e56c14f-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/OrseauLLW18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SantoroFRRCWWVP18,
  author       = {Santoro, Adam and
                  Faulkner, Ryan and
                  Raposo, David and
                  Rae, Jack W. and
                  Chrzanowski, Mike and
                  Weber, Theophane and
                  Wierstra, Daan and
                  Vinyals, Oriol and
                  Pascanu, Razvan and
                  Lillicrap, Timothy P.},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Relational recurrent neural networks},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, {NeurIPS} 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {7310--7321},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/e2eabaf96372e20a9e3d4b5f83723a61-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SantoroFRRCWWVP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-03006,
  author       = {Buesing, Lars and
                  Weber, Theophane and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Eslami, S. M. Ali and
                  Rezende, Danilo Jimenez and
                  Reichert, David P. and
                  Viola, Fabio and
                  Besse, Frederic and
                  Gregor, Karol and
                  Hassabis, Demis and
                  Wierstra, Daan},
  title        = {Learning and Querying Fast Generative Models for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1802.03006},
  year         = {2018},
  url          = {https://arxiv.org/abs/1802.03006},
  eprinttype   = {arXiv},
  eprint       = {1802.03006},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-03006.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-04697,
  author       = {Guez, Arthur and
                  Weber, Th{\'{e}}ophane and
                  Antonoglou, Ioannis and
                  Simonyan, Karen and
                  Vinyals, Oriol and
                  Wierstra, Daan and
                  Munos, R{\'{e}}mi and
                  Silver, David},
  title        = {Learning to Search with {MCTSnets}},
  journal      = {CoRR},
  volume       = {abs/1802.04697},
  year         = {2018},
  url          = {https://arxiv.org/abs/1802.04697},
  eprinttype   = {arXiv},
  eprint       = {1802.04697},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-04697.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-01822,
  author       = {Santoro, Adam and
                  Faulkner, Ryan and
                  Raposo, David and
                  Rae, Jack W. and
                  Chrzanowski, Mike and
                  Weber, Theophane and
                  Wierstra, Daan and
                  Vinyals, Oriol and
                  Pascanu, Razvan and
                  Lillicrap, Timothy P.},
  title        = {Relational recurrent neural networks},
  journal      = {CoRR},
  volume       = {abs/1806.01822},
  year         = {2018},
  url          = {https://arxiv.org/abs/1806.01822},
  eprinttype   = {arXiv},
  eprint       = {1806.01822},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-01822.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-06272,
  author       = {Buesing, Lars and
                  Weber, Theophane and
                  Zwols, Yori and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Guez, Arthur and
                  Lespiau, Jean{-}Baptiste and
                  Heess, Nicolas},
  title        = {Woulda, Coulda, Shoulda: Counterfactually-Guided Policy Search},
  journal      = {CoRR},
  volume       = {abs/1811.06272},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.06272},
  eprinttype   = {arXiv},
  eprint       = {1811.06272},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-06272.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-10928,
  author       = {Orseau, Laurent and
                  Lelis, Levi H. S. and
                  Lattimore, Tor and
                  Weber, Th{\'{e}}ophane},
  title        = {Single-Agent Policy Tree Search With Guarantees},
  journal      = {CoRR},
  volume       = {abs/1811.10928},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.10928},
  eprinttype   = {arXiv},
  eprint       = {1811.10928},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-10928.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WattersZWBPT17,
  author       = {Watters, Nicholas and
                  Zoran, Daniel and
                  Weber, Theophane and
                  Battaglia, Peter W. and
                  Pascanu, Razvan and
                  Tacchetti, Andrea},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Visual Interaction Networks: Learning a Physics Simulator from Video},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {4539--4547},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/8cbd005a556ccd4211ce43f309bc0eac-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WattersZWBPT17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/RacaniereWRBGRB17,
  author       = {Racani{\`{e}}re, S{\'{e}}bastien and
                  Weber, Theophane and
                  Reichert, David P. and
                  Buesing, Lars and
                  Guez, Arthur and
                  Rezende, Danilo Jimenez and
                  Badia, Adri{\`{a}} Puigdom{\`{e}}nech and
                  Vinyals, Oriol and
                  Heess, Nicolas and
                  Li, Yujia and
                  Pascanu, Razvan and
                  Battaglia, Peter W. and
                  Hassabis, Demis and
                  Silver, David and
                  Wierstra, Daan},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Imagination-Augmented Agents for Deep Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {5690--5701},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/9e82757e9a1c12cb710ad680db11f6f1-Abstract.html},
  timestamp    = {Sat, 02 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RacaniereWRBGRB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WattersTWPBZ17,
  author       = {Watters, Nicholas and
                  Tacchetti, Andrea and
                  Weber, Theophane and
                  Pascanu, Razvan and
                  Battaglia, Peter W. and
                  Zoran, Daniel},
  title        = {Visual Interaction Networks},
  journal      = {CoRR},
  volume       = {abs/1706.01433},
  year         = {2017},
  url          = {https://arxiv.org/abs/1706.01433},
  eprinttype   = {arXiv},
  eprint       = {1706.01433},
  timestamp    = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/WattersTWPBZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/PascanuLVHBRRWW17,
  author       = {Pascanu, Razvan and
                  Li, Yujia and
                  Vinyals, Oriol and
                  Heess, Nicolas and
                  Buesing, Lars and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Reichert, David P. and
                  Weber, Theophane and
                  Wierstra, Daan and
                  Battaglia, Peter W.},
  title        = {Learning model-based planning from scratch},
  journal      = {CoRR},
  volume       = {abs/1707.06170},
  year         = {2017},
  url          = {https://arxiv.org/abs/1707.06170},
  eprinttype   = {arXiv},
  eprint       = {1707.06170},
  timestamp    = {Sat, 02 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/PascanuLVHBRRWW17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WeberRRBGRBVHLP17,
  author       = {Weber, Theophane and
                  Racani{\`{e}}re, S{\'{e}}bastien and
                  Reichert, David P. and
                  Buesing, Lars and
                  Guez, Arthur and
                  Rezende, Danilo Jimenez and
                  Badia, Adri{\`{a}} Puigdom{\`{e}}nech and
                  Vinyals, Oriol and
                  Heess, Nicolas and
                  Li, Yujia and
                  Pascanu, Razvan and
                  Battaglia, Peter W. and
                  Silver, David and
                  Wierstra, Daan},
  title        = {Imagination-Augmented Agents for Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1707.06203},
  year         = {2017},
  url          = {https://arxiv.org/abs/1707.06203},
  eprinttype   = {arXiv},
  eprint       = {1707.06203},
  timestamp    = {Sat, 02 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/WeberRRBGRBVHLP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-08378,
  author       = {Botvinick, Matthew M. and
                  Barrett, David G. T. and
                  Battaglia, Peter W. and
                  de Freitas, Nando and
                  Kumaran, Dharshan and
                  Leibo, Joel Z. and
                  Lillicrap, Tim and
                  Modayil, Joseph and
                  Mohamed, Shakir and
                  Rabinowitz, Neil C. and
                  Rezende, Danilo Jimenez and
                  Santoro, Adam and
                  Schaul, Tom and
                  Summerfield, Christopher and
                  Wayne, Greg and
                  Weber, Theophane and
                  Wierstra, Daan and
                  Legg, Shane and
                  Hassabis, Demis},
  title        = {Building Machines that Learn and Think for Themselves: Commentary
                  on {Lake} et al., {Behavioral and Brain Sciences}, 2017},
  journal      = {CoRR},
  volume       = {abs/1711.08378},
  year         = {2017},
  url          = {https://arxiv.org/abs/1711.08378},
  eprinttype   = {arXiv},
  eprint       = {1711.08378},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-08378.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/dt/ChauhanOKCW16,
  author       = {Chauhan, Hari and
                  Onabajo, Marvin and
                  Kvartenko, Vladimir and
                  Coxe, Robin and
                  Weber, Theophane},
  title        = {An Optimization Platform for Digital Predistortion of Power Amplifiers},
  journal      = {{IEEE} Design \& Test},
  volume       = {33},
  number       = {2},
  pages        = {49--58},
  year         = {2016},
  url          = {https://doi.org/10.1109/MDAT.2015.2480702},
  doi          = {10.1109/MDAT.2015.2480702},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/dt/ChauhanOKCW16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/EslamiHWTSKH16,
  author       = {Eslami, S. M. Ali and
                  Heess, Nicolas and
                  Weber, Theophane and
                  Tassa, Yuval and
                  Szepesvari, David and
                  Kavukcuoglu, Koray and
                  Hinton, Geoffrey E.},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Attend, Infer, Repeat: Fast Scene Understanding with Generative Models},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {3225--3233},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/52947e0ade57a09e4a1386d08f17b656-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/EslamiHWTSKH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/EslamiHWTKH16,
  author       = {Eslami, S. M. Ali and
                  Heess, Nicolas and
                  Weber, Theophane and
                  Tassa, Yuval and
                  Kavukcuoglu, Koray and
                  Hinton, Geoffrey E.},
  title        = {Attend, Infer, Repeat: Fast Scene Understanding with Generative Models},
  journal      = {CoRR},
  volume       = {abs/1603.08575},
  year         = {2016},
  url          = {https://arxiv.org/abs/1603.08575},
  eprinttype   = {arXiv},
  eprint       = {1603.08575},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/EslamiHWTKH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SchulmanHWA15,
  author       = {Schulman, John and
                  Heess, Nicolas and
                  Weber, Theophane and
                  Abbeel, Pieter},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Gradient Estimation Using Stochastic Computation Graphs},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {3528--3536},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/de03beffeed9da5f3639a621bcab5dd4-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SchulmanHWA15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SchulmanHWA15,
  author       = {Schulman, John and
                  Heess, Nicolas and
                  Weber, Theophane and
                  Abbeel, Pieter},
  title        = {Gradient Estimation Using Stochastic Computation Graphs},
  journal      = {CoRR},
  volume       = {abs/1506.05254},
  year         = {2015},
  url          = {https://arxiv.org/abs/1506.05254},
  eprinttype   = {arXiv},
  eprint       = {1506.05254},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SchulmanHWA15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/mor/GamarnikGW14,
  author       = {Gamarnik, David and
                  Goldberg, David A. and
                  Weber, Theophane},
  title        = {Correlation Decay in Random Decision Networks},
  journal      = {Mathematics of Operations Research},
  volume       = {39},
  number       = {2},
  pages        = {229--261},
  year         = {2014},
  url          = {https://doi.org/10.1287/moor.2013.0609},
  doi          = {10.1287/MOOR.2013.0609},
  timestamp    = {Sun, 28 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/GamarnikGW14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1301-1299,
  author       = {Wingate, David and
                  Weber, Theophane},
  title        = {Automated Variational Inference in Probabilistic Programming},
  journal      = {CoRR},
  volume       = {abs/1301.1299},
  year         = {2013},
  url          = {https://arxiv.org/abs/1301.1299},
  eprinttype   = {arXiv},
  eprint       = {1301.1299},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-1299.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/DauwelsWVMC12,
  author       = {Dauwels, Justin and
                  Weber, Theophane and
                  Vialatte, Fran{\c{c}}ois B. and
                  Musha, Toshimitsu and
                  Cichocki, Andrzej},
  title        = {Quantifying Statistical Interdependence, Part {III:} {$N > 2$} Point Processes},
  journal      = {Neural Computation},
  volume       = {24},
  number       = {2},
  pages        = {408--454},
  year         = {2012},
  url          = {https://doi.org/10.1162/NECO\_a\_00235},
  doi          = {10.1162/NECO\_A\_00235},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/DauwelsWVMC12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1212-2991,
  author       = {Hershey, Shawn and
                  Bernstein, Jeffrey and
                  Bradley, Bill and
                  Schweitzer, Andrew and
                  Stein, Noah and
                  Weber, Theophane and
                  Vigoda, Benjamin},
  title        = {Accelerating Inference: towards a full Language, Compiler and Hardware
                  stack},
  journal      = {CoRR},
  volume       = {abs/1212.2991},
  year         = {2012},
  url          = {https://arxiv.org/abs/1212.2991},
  eprinttype   = {arXiv},
  eprint       = {1212.2991},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1212-2991.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/msom/GallienW10,
  author       = {Gallien, J{\'{e}}r{\'{e}}mie and
                  Weber, Th{\'{e}}ophane},
  title        = {To Wave or Not to Wave? Order Release Policies for Warehouses with
                  an Automated Sorter},
  journal      = {Manufacturing \& Service Operations Management},
  volume       = {12},
  number       = {4},
  pages        = {642--662},
  year         = {2010},
  url          = {https://doi.org/10.1287/msom.1100.0291},
  doi          = {10.1287/MSOM.1100.0291},
  timestamp    = {Thu, 01 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/msom/GallienW10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/islped/VigodaRBWB10,
  author       = {Vigoda, Benjamin and
                  Reynolds, David and
                  Bernstein, Jeffrey and
                  Weber, Theophane and
                  Bradley, Bill},
  editor       = {Oklobdzija, Vojin G. and
                  Pangle, Barry and
                  Chang, Naehyuck and
                  Shanbhag, Naresh R. and
                  Kim, Chris H.},
  title        = {Low power logic for statistical inference},
  booktitle    = {Proceedings of the 2010 International Symposium on Low Power Electronics
                  and Design, 2010, Austin, Texas, {USA}, August 18-20, 2010},
  pages        = {349--354},
  publisher    = {{ACM}},
  year         = {2010},
  url          = {https://doi.org/10.1145/1840845.1840918},
  doi          = {10.1145/1840845.1840918},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/islped/VigodaRBWB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/soda/GamarnikGW10,
  author       = {Gamarnik, David and
                  Goldberg, David A. and
                  Weber, Theophane},
  editor       = {Charikar, Moses},
  title        = {{PTAS} for Maximum Weight Independent Set Problem with Random Weights
                  in Bounded Degree Graphs},
  booktitle    = {Proceedings of the Twenty-First Annual {ACM-SIAM} Symposium on Discrete
                  Algorithms, {SODA} 2010, Austin, Texas, {USA}, January 17-19, 2010},
  pages        = {268--278},
  publisher    = {{SIAM}},
  year         = {2010},
  url          = {https://doi.org/10.1137/1.9781611973075.23},
  doi          = {10.1137/1.9781611973075.23},
  timestamp    = {Tue, 02 Feb 2021 17:07:39 +0100},
  biburl       = {https://dblp.org/rec/conf/soda/GamarnikGW10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/DauwelsVWC09,
  author       = {Dauwels, Justin and
                  Vialatte, Fran{\c{c}}ois B. and
                  Weber, Theophane and
                  Cichocki, Andrzej},
  title        = {Quantifying Statistical Interdependence by Message Passing on Graphs
                  - Part {I:} One-Dimensional Point Processes},
  journal      = {Neural Computation},
  volume       = {21},
  number       = {8},
  pages        = {2152--2202},
  year         = {2009},
  url          = {https://doi.org/10.1162/neco.2009.04-08-746},
  doi          = {10.1162/NECO.2009.04-08-746},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/DauwelsVWC09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Neural Comput. 21(8), 2009, pp. 2203--2268: Part II of a two-part article
% (multidimensional point processes).
% Names are given in the unambiguous "Last, First" form.
@article{DBLP:journals/neco/DauwelsVWMC09,
  author       = {Dauwels, Justin and
                  Vialatte, Fran{\c{c}}ois B. and
                  Weber, Theophane and
                  Musha, Toshimitsu and
                  Cichocki, Andrzej},
  title        = {Quantifying Statistical Interdependence by Message Passing on Graphs
                  - Part {II:} Multidimensional Point Processes},
  journal      = {Neural Comput.},
  volume       = {21},
  number       = {8},
  pages        = {2203--2268},
  year         = {2009},
  url          = {https://doi.org/10.1162/neco.2009.11-08-899},
  doi          = {10.1162/NECO.2009.11-08-899},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/DauwelsVWMC09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 0912.0338 (2009), recorded dblp-style as a CoRR article.
% The arXiv identifier is carried in eprint/eprinttype; the url uses https
% like every other link in this file.
@article{DBLP:journals/corr/abs-0912-0338,
  author       = {David Gamarnik and
                  David A. Goldberg and
                  Theophane Weber},
  title        = {Correlation Decay in Random Decision Networks},
  journal      = {CoRR},
  volume       = {abs/0912.0338},
  year         = {2009},
  url          = {https://arxiv.org/abs/0912.0338},
  eprinttype   = {arXiv},
  eprint       = {0912.0338},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-0912-0338.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Allerton 2008 conference paper (IEEE), pp. 1381--1388.
% Names are given in the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/allerton/DauwelsVWC08,
  author       = {Dauwels, Justin and
                  Vialatte, Fran{\c{c}}ois B. and
                  Weber, Theophane and
                  Cichocki, Andrzej},
  title        = {Analyzing brain signals by combinatorial optimization},
  booktitle    = {46th Annual Allerton Conference on Communication, Control, and Computing,
                  Allerton 2008, Monticello, IL, USA, September 24-26, 2008},
  pages        = {1381--1388},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ALLERTON.2008.4797722},
  doi          = {10.1109/ALLERTON.2008.4797722},
  timestamp    = {Sun, 17 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/allerton/DauwelsVWC08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CDC 2008 conference paper (IEEE), pp. 67--72.
% Names are given in "von Last, First" form so the particle "de" is parsed
% explicitly rather than inferred from letter case.
% NOTE(review): the second author is spelled with an accent here
% (Th{\'{e}}ophane) but as "Theophane" in the other records of this file;
% confirm which form should be used consistently.
@inproceedings{DBLP:conf/cdc/FariasW08,
  author       = {de Farias, Daniela Pucci and
                  Weber, Th{\'{e}}ophane},
  title        = {Choosing the cost vector of the linear programming approach to approximate
                  dynamic programming},
  booktitle    = {Proceedings of the 47th {IEEE} Conference on Decision and Control,
                  {CDC} 2008, December 9-11, 2008, Canc{\'{u}}n, Mexico},
  pages        = {67--72},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/CDC.2008.4739452},
  doi          = {10.1109/CDC.2008.4739452},
  timestamp    = {Fri, 04 Mar 2022 13:27:23 +0100},
  biburl       = {https://dblp.org/rec/conf/cdc/FariasW08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICONIP 2008 paper in LNCS 5506 (Springer), pp. 177--185.
% Names are given in the unambiguous "Last, First" form.
% NOTE(review): the key ends in 09 while year is 2008, and the booktitle says
% "Revised Selected Papers"; confirm whether the publication year should be 2009.
@inproceedings{DBLP:conf/iconip/DauwelsVWC09,
  author       = {Dauwels, Justin and
                  Vialatte, Fran{\c{c}}ois B. and
                  Weber, Theophane and
                  Cichocki, Andrzej},
  editor       = {K{\"{o}}ppen, Mario and
                  Kasabov, Nikola K. and
                  Coghill, George G.},
  title        = {On Similarity Measures for Spike Trains},
  booktitle    = {Advances in Neuro-Information Processing, 15th International Conference,
                  {ICONIP} 2008, Auckland, New Zealand, November 25-28, 2008, Revised
                  Selected Papers, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5506},
  pages        = {177--185},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-642-02490-0\_22},
  doi          = {10.1007/978-3-642-02490-0\_22},
  timestamp    = {Sun, 02 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iconip/DauwelsVWC09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICONIP 2008 paper in LNCS 5506 (Springer), pp. 318--326.
% Names are given in the unambiguous "Last, First" form.
% NOTE(review): the key ends in 09a while year is 2008, and the booktitle says
% "Revised Selected Papers"; confirm whether the publication year should be 2009.
@inproceedings{DBLP:conf/iconip/DauwelsVWC09a,
  author       = {Dauwels, Justin and
                  Vialatte, Fran{\c{c}}ois B. and
                  Weber, Theophane and
                  Cichocki, Andrzej},
  editor       = {K{\"{o}}ppen, Mario and
                  Kasabov, Nikola K. and
                  Coghill, George G.},
  title        = {An Exemplar-Based Statistical Model for the Dynamics of Neural Synchrony},
  booktitle    = {Advances in Neuro-Information Processing, 15th International Conference,
                  {ICONIP} 2008, Auckland, New Zealand, November 25-28, 2008, Revised
                  Selected Papers, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5506},
  pages        = {318--326},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-642-02490-0\_39},
  doi          = {10.1007/978-3-642-02490-0\_39},
  timestamp    = {Sun, 02 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iconip/DauwelsVWC09a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
A service of Schloss Dagstuhl - Leibniz Center for Informatics