% BibTeX records: Aviv Tamar (dblp export)

% download as .bib file

% arXiv preprint (CoRR abs/2403.09859).
% Only the acronym is brace-protected so the colon stays visible to sentence-casing styles.
@article{DBLP:journals/corr/abs-2403-09859,
  author     = {Rimon, Zohar and Jurgenson, Tom and Krupnik, Orr and Adler, Gilad and Tamar, Aviv},
  title      = {{MAMBA}: An Effective World Model Approach for Meta-Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2403.09859},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.09859},
  doi        = {10.48550/ARXIV.2403.09859},
  eprinttype = {arXiv},
  eprint     = {2403.09859},
  timestamp  = {Fri, 05 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-09859.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2023 paper (PMLR vol. 229); same title and authors as the CoRR record DBLP:journals/corr/abs-2310-12862.
@inproceedings{DBLP:conf/corl/KrupnikSJT23,
  author     = {Krupnik, Orr and Shafer, Elisei and Jurgenson, Tom and Tamar, Aviv},
  editor     = {Tan, Jie and Toussaint, Marc and Darvish, Kourosh},
  title      = {Fine-Tuning Generative Models as an Inference Method for Robotic Tasks},
  booktitle  = {Conference on Robot Learning, CoRL 2023, 6-9 November 2023, Atlanta, GA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {229},
  pages      = {866--886},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v229/krupnik23a.html},
  timestamp  = {Tue, 20 Feb 2024 12:11:46 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/KrupnikSJT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2023 paper (PMLR vol. 229).
@inproceedings{DBLP:conf/corl/SudryJTK23,
  author     = {Sudry, Matan and Jurgenson, Tom and Tamar, Aviv and Karpas, Erez},
  editor     = {Tan, Jie and Toussaint, Marc and Darvish, Kourosh},
  title      = {Hierarchical Planning for Rope Manipulation using Knot Theory and a Learned Inverse Model},
  booktitle  = {Conference on Robot Learning, CoRL 2023, 6-9 November 2023, Atlanta, GA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {229},
  pages      = {1596--1609},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v229/sudry23a.html},
  timestamp  = {Tue, 20 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/SudryJTK23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper (PMLR vol. 202); same title and authors as the CoRR record DBLP:journals/corr/abs-2306-02418.
% The camelCase method name and the proper noun are brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/icml/ChoshenT23,
  author     = {Choshen, Era and Tamar, Aviv},
  editor     = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title      = {{ContraBAR}: Contrastive {Bayes}-Adaptive Deep {RL}},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {6005--6027},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/choshen23a.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/ChoshenT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper (PMLR vol. 202); same title and authors as the CoRR record DBLP:journals/corr/abs-2211-01724.
@inproceedings{DBLP:conf/icml/LeibovichJANT23,
  author     = {Leibovich, Gal and Jacob, Guy and Avner, Or and Novik, Gal and Tamar, Aviv},
  editor     = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title      = {Learning Control by Iterative Inversion},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {19228--19255},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/leibovich23a.html},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LeibovichJANT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper (PMLR vol. 202); same title and authors as the CoRR record DBLP:journals/corr/abs-2307-03186.
% Only the acronym is brace-protected so the colon stays visible to sentence-casing styles.
@inproceedings{DBLP:conf/icml/ShenfeldHTA23,
  author     = {Shenfeld, Idan and Hong, Zhang{-}Wei and Tamar, Aviv and Agrawal, Pulkit},
  editor     = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title      = {{TGRL}: An Algorithm for Teacher Guided Reinforcement Learning},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {31077--31093},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/shenfeld23a.html},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/ShenfeldHTA23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2023 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2302-07940.
@inproceedings{DBLP:conf/icra/RohanimaneshMRT23,
  author     = {Rohanimanesh, Khashayar and Metzger, Jake and Richards, William and Tamar, Aviv},
  title      = {Online Tool Selection with Learned Grasp Prediction Models},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages      = {5844--5850},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICRA48891.2023.10160952},
  doi        = {10.1109/ICRA48891.2023.10160952},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/RohanimaneshMRT23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2306-03072.
% The url is stored raw (no backslash before the underscore) so verbatim url handling yields a working link.
@inproceedings{DBLP:conf/nips/ZisselmanLST23,
  author     = {Zisselman, Ev and Lavie, Itai and Soudry, Daniel and Tamar, Aviv},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title      = {Explore to Generalize in Zero-Shot {RL}},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper_files/paper/2023/hash/c793577b644268259b1416464a6cdb8c-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ZisselmanLST23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NSDI 2023 paper (USENIX).
% Only the acronym is brace-protected so the colon stays visible to sentence-casing styles.
@inproceedings{DBLP:conf/nsdi/PerryFHKMST23,
  author     = {Perry, Yarin and Frujeri, Felipe Vieira and Hoch, Chaim and Kandula, Srikanth and Menache, Ishai and Schapira, Michael and Tamar, Aviv},
  editor     = {Balakrishnan, Mahesh and Ghobadi, Manya},
  title      = {{DOTE}: Rethinking (Predictive) {WAN} Traffic Engineering},
  booktitle  = {20th {USENIX} Symposium on Networked Systems Design and Implementation, {NSDI} 2023, Boston, MA, April 17-19, 2023},
  pages      = {1557--1581},
  publisher  = {{USENIX} Association},
  year       = {2023},
  url        = {https://www.usenix.org/conference/nsdi23/presentation/perry},
  timestamp  = {Thu, 11 May 2023 17:08:22 +0200},
  biburl     = {https://dblp.org/rec/conf/nsdi/PerryFHKMST23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IEEE SPW 2023 paper; same title and authors as the IACR ePrint record DBLP:journals/iacr/ZurDVET23.
@inproceedings{DBLP:conf/sp/ZurDVET23,
  author     = {Zur, Roi Bar and Dori, Danielle and Vardi, Sharon and Eyal, Ittay and Tamar, Aviv},
  title      = {Deep Bribe: Predicting the Rise of Bribery in Blockchain Mining with Deep {RL}},
  booktitle  = {2023 {IEEE} Security and Privacy Workshops (SPW), San Francisco, CA, USA, May 25, 2023},
  pages      = {29--37},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/SPW59333.2023.00008},
  doi        = {10.1109/SPW59333.2023.00008},
  timestamp  = {Thu, 21 Sep 2023 16:11:09 +0200},
  biburl     = {https://dblp.org/rec/conf/sp/ZurDVET23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IEEE S and P 2023 paper; same title and authors as DBLP:journals/iacr/ZurAET22 and DBLP:conf/systor/ZurAET22.
% The mixed-case system name is brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/sp/ZurAET23,
  author     = {Zur, Roi Bar and Abu{-}Hanna, Ameer and Eyal, Ittay and Tamar, Aviv},
  title      = {{WeRLman}: To Tackle Whale (Transactions), Go Deep {(RL)}},
  booktitle  = {44th {IEEE} Symposium on Security and Privacy, {SP} 2023, San Francisco, CA, USA, May 21-25, 2023},
  pages      = {93--110},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/SP46215.2023.10179444},
  doi        = {10.1109/SP46215.2023.10179444},
  timestamp  = {Thu, 27 Jul 2023 08:17:10 +0200},
  biburl     = {https://dblp.org/rec/conf/sp/ZurAET23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2301.01320).
@article{DBLP:journals/corr/abs-2301-01320,
  author     = {Mannor, Shie and Tamar, Aviv},
  title      = {Towards Deployable {RL} - What's Broken with {RL} Research and a Potential Fix},
  journal    = {CoRR},
  volume     = {abs/2301.01320},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.01320},
  doi        = {10.48550/ARXIV.2301.01320},
  eprinttype = {arXiv},
  eprint     = {2301.01320},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-01320.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2302.07940); same title and authors as the ICRA record DBLP:conf/icra/RohanimaneshMRT23.
@article{DBLP:journals/corr/abs-2302-07940,
  author     = {Rohanimanesh, Khashayar and Metzger, Jake and Richards, William and Tamar, Aviv},
  title      = {Online Tool Selection with Learned Grasp Prediction Models},
  journal    = {CoRR},
  volume     = {abs/2302.07940},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.07940},
  doi        = {10.48550/ARXIV.2302.07940},
  eprinttype = {arXiv},
  eprint     = {2302.07940},
  timestamp  = {Mon, 20 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-07940.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2303.00735).
@article{DBLP:journals/corr/abs-2303-00735,
  author     = {Perry, Yarin and Frujeri, Felipe Vieira and Hoch, Chaim and Kandula, Srikanth and Menache, Ishai and Schapira, Michael and Tamar, Aviv},
  title      = {A Deep Learning Perspective on Network Routing},
  journal    = {CoRR},
  volume     = {abs/2303.00735},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.00735},
  doi        = {10.48550/ARXIV.2303.00735},
  eprinttype = {arXiv},
  eprint     = {2303.00735},
  timestamp  = {Tue, 14 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-00735.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2305.10171).
@article{DBLP:journals/corr/abs-2305-10171,
  author     = {Jurgenson, Tom and Tamar, Aviv},
  title      = {Goal-Conditioned Supervised Learning with Sub-Goal Prediction},
  journal    = {CoRR},
  volume     = {abs/2305.10171},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.10171},
  doi        = {10.48550/ARXIV.2305.10171},
  eprinttype = {arXiv},
  eprint     = {2305.10171},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-10171.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2306.02418); same title and authors as the ICML record DBLP:conf/icml/ChoshenT23.
% The camelCase method name and the proper noun are brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2306-02418,
  author     = {Choshen, Era and Tamar, Aviv},
  title      = {{ContraBAR}: Contrastive {Bayes}-Adaptive Deep {RL}},
  journal    = {CoRR},
  volume     = {abs/2306.02418},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.02418},
  doi        = {10.48550/ARXIV.2306.02418},
  eprinttype = {arXiv},
  eprint     = {2306.02418},
  timestamp  = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-02418.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2306.03072); same title and authors as the NeurIPS record DBLP:conf/nips/ZisselmanLST23.
@article{DBLP:journals/corr/abs-2306-03072,
  author     = {Zisselman, Ev and Lavie, Itai and Soudry, Daniel and Tamar, Aviv},
  title      = {Explore to Generalize in Zero-Shot {RL}},
  journal    = {CoRR},
  volume     = {abs/2306.03072},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03072},
  doi        = {10.48550/ARXIV.2306.03072},
  eprinttype = {arXiv},
  eprint     = {2306.03072},
  timestamp  = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03072.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2306.05957).
% Only the acronym is brace-protected so the colon stays visible to sentence-casing styles.
@article{DBLP:journals/corr/abs-2306-05957,
  author     = {Daniel, Tal and Tamar, Aviv},
  title      = {{DDLP}: Unsupervised Object-Centric Video Prediction with Deep Dynamic Latent Particles},
  journal    = {CoRR},
  volume     = {abs/2306.05957},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.05957},
  doi        = {10.48550/ARXIV.2306.05957},
  eprinttype = {arXiv},
  eprint     = {2306.05957},
  timestamp  = {Wed, 14 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-05957.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2307.03186); same title and authors as the ICML record DBLP:conf/icml/ShenfeldHTA23.
% Only the acronym is brace-protected so the colon stays visible to sentence-casing styles.
@article{DBLP:journals/corr/abs-2307-03186,
  author     = {Shenfeld, Idan and Hong, Zhang{-}Wei and Tamar, Aviv and Agrawal, Pulkit},
  title      = {{TGRL}: An Algorithm for Teacher Guided Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2307.03186},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.03186},
  doi        = {10.48550/ARXIV.2307.03186},
  eprinttype = {arXiv},
  eprint     = {2307.03186},
  timestamp  = {Mon, 10 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-03186.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2310.12862); same title and authors as the CoRL record DBLP:conf/corl/KrupnikSJT23.
@article{DBLP:journals/corr/abs-2310-12862,
  author     = {Krupnik, Orr and Shafer, Elisei and Jurgenson, Tom and Tamar, Aviv},
  title      = {Fine-Tuning Generative Models as an Inference Method for Robotic Tasks},
  journal    = {CoRR},
  volume     = {abs/2310.12862},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.12862},
  doi        = {10.48550/ARXIV.2310.12862},
  eprinttype = {arXiv},
  eprint     = {2310.12862},
  timestamp  = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-12862.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IACR ePrint record 2023/472; same title and authors as the SPW record DBLP:conf/sp/ZurDVET23.
@article{DBLP:journals/iacr/ZurDVET23,
  author     = {Zur, Roi Bar and Dori, Danielle and Vardi, Sharon and Eyal, Ittay and Tamar, Aviv},
  title      = {Deep Bribe: Predicting the Rise of Bribery in Blockchain Mining with Deep {RL}},
  journal    = {{IACR} Cryptol. ePrint Arch.},
  pages      = {472},
  year       = {2023},
  url        = {https://eprint.iacr.org/2023/472},
  timestamp  = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/iacr/ZurDVET23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2022 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2109-11792.
% Booktitle spelling corrected to Twelfth; the proper adjective in the title is brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/aaai/TamarSZ22,
  author     = {Tamar, Aviv and Soudry, Daniel and Zisselman, Ev},
  title      = {Regularization Guarantees Generalization in {Bayesian} Reinforcement Learning through Algorithmic Stability},
  booktitle  = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI} 2022, Thirty-Fourth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2022 Virtual Event, February 22 - March 1, 2022},
  pages      = {8423--8431},
  publisher  = {{AAAI} Press},
  year       = {2022},
  url        = {https://doi.org/10.1609/aaai.v36i8.20818},
  doi        = {10.1609/AAAI.V36I8.20818},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/TamarSZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2022 paper (PMLR vol. 162); same title and authors as the CoRR record DBLP:journals/corr/abs-2205-15821.
@inproceedings{DBLP:conf/icml/DanielT22,
  author     = {Daniel, Tal and Tamar, Aviv},
  editor     = {Chaudhuri, Kamalika and Jegelka, Stefanie and Song, Le and Szepesv{\'{a}}ri, Csaba and Niu, Gang and Sabato, Sivan},
  title      = {Unsupervised Image Representation Learning with Deep Latent Particles},
  booktitle  = {International Conference on Machine Learning, {ICML} 2022, 17-23 July 2022, Baltimore, Maryland, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {4644--4665},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/daniel22a.html},
  timestamp  = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/DanielT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2022 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2111-00765.
@inproceedings{DBLP:conf/icra/LeibovichJENT22,
  author     = {Leibovich, Gal and Jacob, Guy and Endrawis, Shadi and Novik, Gal and Tamar, Aviv},
  title      = {Validate on Sim, Detect on Real - Model Selection for Domain Randomization},
  booktitle  = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages      = {7528--7535},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICRA46639.2022.9811621},
  doi        = {10.1109/ICRA46639.2022.9811621},
  timestamp  = {Wed, 20 Jul 2022 18:22:23 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/LeibovichJENT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2206-10716.
% Editor given names are stored in full (the style abbreviates if needed); the url is stored raw, without backslash escapes.
% NOTE(review): the expansions of S. Mohamed and A. Agarwal are taken from the NeurIPS 2022 proceedings front matter - confirm.
@inproceedings{DBLP:conf/nips/RimonTA22,
  author     = {Rimon, Zohar and Tamar, Aviv and Adler, Gilad},
  editor     = {Koyejo, Sanmi and Mohamed, Shakir and Agarwal, Alekh and Belgrave, Danielle and Cho, Kyunghyun and Oh, Alice},
  title      = {Meta Reinforcement Learning with Finite Training Tasks - a Density Estimation Approach},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper_files/paper/2022/hash/5833b4daf5b076dd1cdb362b163dff0c-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/RimonTA22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SYSTOR 2022 record; same work as DBLP:conf/sp/ZurAET23 and DBLP:journals/iacr/ZurAET22.
% Title is stored in Title Case to match those two records, with the mixed-case system name brace-protected.
@inproceedings{DBLP:conf/systor/ZurAET22,
  author     = {Zur, Roi Bar and Abu{-}Hanna, Ameer and Eyal, Ittay and Tamar, Aviv},
  editor     = {Malka, Michal and Kolodner, Hillel and Bellosa, Frank and Gabel, Moshe},
  title      = {{WeRLman}: To Tackle Whale (Transactions), Go Deep {(RL)}},
  booktitle  = {{SYSTOR} '22: The 15th {ACM} International Systems and Storage Conference, Haifa, Israel, June 13 - 15, 2022},
  pages      = {148},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3534056.3535005},
  doi        = {10.1145/3534056.3535005},
  timestamp  = {Mon, 13 Jun 2022 17:06:26 +0200},
  biburl     = {https://dblp.org/rec/conf/systor/ZurAET22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2205.15821); same title and authors as the ICML record DBLP:conf/icml/DanielT22.
@article{DBLP:journals/corr/abs-2205-15821,
  author     = {Daniel, Tal and Tamar, Aviv},
  title      = {Unsupervised Image Representation Learning with Deep Latent Particles},
  journal    = {CoRR},
  volume     = {abs/2205.15821},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.15821},
  doi        = {10.48550/ARXIV.2205.15821},
  eprinttype = {arXiv},
  eprint     = {2205.15821},
  timestamp  = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-15821.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2206.10716); same title and authors as the NeurIPS record DBLP:conf/nips/RimonTA22.
@article{DBLP:journals/corr/abs-2206-10716,
  author     = {Rimon, Zohar and Tamar, Aviv and Adler, Gilad},
  title      = {Meta Reinforcement Learning with Finite Training Tasks - a Density Estimation Approach},
  journal    = {CoRR},
  volume     = {abs/2206.10716},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.10716},
  doi        = {10.48550/ARXIV.2206.10716},
  eprinttype = {arXiv},
  eprint     = {2206.10716},
  timestamp  = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-10716.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2211.01724); same title and authors as the ICML record DBLP:conf/icml/LeibovichJANT23.
@article{DBLP:journals/corr/abs-2211-01724,
  author     = {Leibovich, Gal and Jacob, Guy and Avner, Or and Novik, Gal and Tamar, Aviv},
  title      = {Learning Control by Iterative Inversion},
  journal    = {CoRR},
  volume     = {abs/2211.01724},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.01724},
  doi        = {10.48550/ARXIV.2211.01724},
  eprinttype = {arXiv},
  eprint     = {2211.01724},
  timestamp  = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-01724.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IACR ePrint record 2022/175; same title and authors as DBLP:conf/sp/ZurAET23.
% The mixed-case system name is brace-protected against sentence-casing styles.
@article{DBLP:journals/iacr/ZurAET22,
  author     = {Zur, Roi Bar and Abu{-}Hanna, Ameer and Eyal, Ittay and Tamar, Aviv},
  title      = {{WeRLman}: To Tackle Whale (Transactions), Go Deep {(RL)}},
  journal    = {{IACR} Cryptol. ePrint Arch.},
  pages      = {175},
  year       = {2022},
  url        = {https://eprint.iacr.org/2022/175},
  timestamp  = {Tue, 22 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/iacr/ZurAET22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper.
% The mixed-case model name is brace-protected; the url is stored raw, without backslash escapes before underscores.
@inproceedings{DBLP:conf/cvpr/DanielT21,
  author     = {Daniel, Tal and Tamar, Aviv},
  title      = {{Soft-IntroVAE}: Analyzing and Improving the Introspective Variational Autoencoder},
  booktitle  = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2021, virtual, June 19-25, 2021},
  pages      = {4391--4400},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2021},
  url        = {https://openaccess.thecvf.com/content/CVPR2021/html/Daniel_Soft-IntroVAE_Analyzing_and_Improving_the_Introspective_Variational_Autoencoder_CVPR_2021_paper.html},
  doi        = {10.1109/CVPR46437.2021.00437},
  timestamp  = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/DanielT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2021 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2105-04607.
@inproceedings{DBLP:conf/icra/EndrawisLJNT21,
  author     = {Endrawis, Shadi and Leibovich, Gal and Jacob, Guy and Novik, Gal and Tamar, Aviv},
  title      = {Efficient Self-Supervised Data Collection for Offline Robot Learning},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {4650--4656},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561097},
  doi        = {10.1109/ICRA48506.2021.9561097},
  timestamp  = {Fri, 22 Oct 2021 19:54:31 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/EndrawisLJNT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2021 paper; same title and authors as the CoRR record DBLP:journals/corr/abs-2103-11144.
@inproceedings{DBLP:conf/icra/RabinovitzGT21,
  author     = {Rabinovitz, Carmel and Grupen, Niko A. and Tamar, Aviv},
  title      = {Unsupervised Feature Learning for Manipulation with Contrastive Domain Randomization},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {10153--10159},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561527},
  doi        = {10.1109/ICRA48506.2021.9561527},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/RabinovitzGT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
@inproceedings{DBLP:conf/nips/DorfmanST21,
  author     = {Dorfman, Ron and Shenfeld, Idan and Tamar, Aviv},
  editor     = {Ranzato, Marc'Aurelio and Beygelzimer, Alina and Dauphin, Yann N. and Liang, Percy and Vaughan, Jennifer Wortman},
  title      = {Offline Meta Reinforcement Learning - Identifiability Challenges and Effective Data Collection Strategies},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {4607--4618},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/248024541dbda1d3fd75fe49d1a4df4d-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DorfmanST21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2103.11144); same title and authors as the ICRA record DBLP:conf/icra/RabinovitzGT21.
@article{DBLP:journals/corr/abs-2103-11144,
  author     = {Rabinovitz, Carmel and Grupen, Niko A. and Tamar, Aviv},
  title      = {Unsupervised Feature Learning for Manipulation with Contrastive Domain Randomization},
  journal    = {CoRR},
  volume     = {abs/2103.11144},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.11144},
  eprinttype = {arXiv},
  eprint     = {2103.11144},
  timestamp  = {Wed, 24 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-11144.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.04607); same title and authors as the ICRA record DBLP:conf/icra/EndrawisLJNT21.
@article{DBLP:journals/corr/abs-2105-04607,
  author     = {Endrawis, Shadi and Leibovich, Gal and Jacob, Guy and Novik, Gal and Tamar, Aviv},
  title      = {Efficient Self-Supervised Data Collection for Offline Robot Learning},
  journal    = {CoRR},
  volume     = {abs/2105.04607},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.04607},
  eprinttype = {arXiv},
  eprint     = {2105.04607},
  timestamp  = {Fri, 14 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-04607.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.11792); same title and authors as the AAAI record DBLP:conf/aaai/TamarSZ22.
% The proper adjective in the title is brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2109-11792,
  author     = {Tamar, Aviv and Soudry, Daniel and Zisselman, Ev},
  title      = {Regularization Guarantees Generalization in {Bayesian} Reinforcement Learning through Algorithmic Stability},
  journal    = {CoRR},
  volume     = {abs/2109.11792},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.11792},
  eprinttype = {arXiv},
  eprint     = {2109.11792},
  timestamp  = {Mon, 27 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-11792.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2111.00765); same title and authors as the ICRA record DBLP:conf/icra/LeibovichJENT22.
@article{DBLP:journals/corr/abs-2111-00765,
  author     = {Leibovich, Gal and Jacob, Guy and Endrawis, Shadi and Novik, Gal and Tamar, Aviv},
  title      = {Validate on Sim, Detect on Real - Model Selection for Domain Randomization},
  journal    = {CoRR},
  volume     = {abs/2111.00765},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.00765},
  eprinttype = {arXiv},
  eprint     = {2111.00765},
  timestamp  = {Fri, 05 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-00765.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AFT 2020 paper (ACM).
@inproceedings{DBLP:conf/aft/ZurET20,
  author     = {Zur, Roi Bar and Eyal, Ittay and Tamar, Aviv},
  title      = {Efficient {MDP} Analysis for Selfish-Mining in Blockchains},
  booktitle  = {{AFT} '20: 2nd {ACM} Conference on Advances in Financial Technologies, New York, NY, USA, October 21-23, 2020},
  pages      = {113--131},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3419614.3423264},
  doi        = {10.1145/3419614.3423264},
  timestamp  = {Thu, 29 Oct 2020 14:40:13 +0100},
  biburl     = {https://dblp.org/rec/conf/aft/ZurET20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The url keeps raw underscores: url-aware styles and biblatex read this field verbatim,
% so backslash-escaped underscores would end up inside the link itself.
@inproceedings{DBLP:conf/cvpr/ZisselmanT20,
  author     = {Zisselman, Ev and
                Tamar, Aviv},
  title      = {Deep Residual Flow for Out of Distribution Detection},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern
                Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {13991--14000},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content_CVPR_2020/html/Zisselman_Deep_Residual_Flow_for_Out_of_Distribution_Detection_CVPR_2020_paper.html},
  doi        = {10.1109/CVPR42600.2020.01401},
  timestamp  = {Tue, 31 Aug 2021 14:00:04 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/ZisselmanT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hotnets/RotmanST20,
  author     = {Rotman, Noga H. and
                Schapira, Michael and
                Tamar, Aviv},
  editor     = {Zhao, Ben Y. and
                Zheng, Heather and
                Madhyastha, Harsha V. and
                Padmanabhan, Venkat N.},
  title      = {Online Safety Assurance for Learning-Augmented Systems},
  booktitle  = {HotNets '20: The 19th {ACM} Workshop on Hot Topics in Networks,
                Virtual Event, USA, November 4-6, 2020},
  pages      = {88--95},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3422604.3425940},
  doi        = {10.1145/3422604.3425940},
  timestamp  = {Mon, 20 Jun 2022 09:15:37 +0200},
  biburl     = {https://dblp.org/rec/conf/hotnets/RotmanST20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The dash after "Sub-Goal Trees" is restored; the arXiv record of this paper in this
% file (abs-2002-12361) carries it.
@inproceedings{DBLP:conf/icml/JurgensonAGT20,
  author     = {Jurgenson, Tom and
                Avner, Or and
                Groshev, Edward and
                Tamar, Aviv},
  title      = {Sub-Goal Trees -- a Framework for Goal-Based Reinforcement Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine
                Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {5020--5030},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/jurgenson20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/JurgensonAGT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LiuKTAT20,
  author     = {Liu, Kara and
                Kurutach, Thanard and
                Tung, Christine and
                Abbeel, Pieter and
                Tamar, Aviv},
  title      = {Hallucinative Topological Memory for Zero-Shot Visual Planning},
  booktitle  = {Proceedings of the 37th International Conference on Machine
                Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {6259--6270},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/liu20h.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/LiuKTAT20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ijcai/SarafianTK20,
  author     = {Sarafian, Elad and
                Tamar, Aviv and
                Kraus, Sarit},
  editor     = {Bessiere, Christian},
  title      = {Constrained Policy Improvement for Efficient Reinforcement Learning},
  booktitle  = {Proceedings of the Twenty-Ninth International Joint Conference
                on Artificial Intelligence, {IJCAI} 2020},
  pages      = {2863--2871},
  publisher  = {ijcai.org},
  year       = {2020},
  url        = {https://doi.org/10.24963/ijcai.2020/396},
  doi        = {10.24963/IJCAI.2020/396},
  timestamp  = {Mon, 20 Jul 2020 12:38:52 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/SarafianTK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2001-05419,
  author     = {Zisselman, Ev and
                Tamar, Aviv},
  title      = {Deep Residual Flow for Novelty Detection},
  journal    = {CoRR},
  volume     = {abs/2001.05419},
  year       = {2020},
  url        = {https://arxiv.org/abs/2001.05419},
  eprinttype = {arXiv},
  eprint     = {2001.05419},
  timestamp  = {Fri, 17 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2001-05419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2002-12336,
  author     = {Liu, Kara and
                Kurutach, Thanard and
                Tung, Christine and
                Abbeel, Pieter and
                Tamar, Aviv},
  title      = {Hallucinative Topological Memory for Zero-Shot Visual Planning},
  journal    = {CoRR},
  volume     = {abs/2002.12336},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.12336},
  eprinttype = {arXiv},
  eprint     = {2002.12336},
  timestamp  = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-12336.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% "--" typesets the dash in the title as an en dash instead of a spaced hyphen.
@article{DBLP:journals/corr/abs-2002-12361,
  author     = {Jurgenson, Tom and
                Avner, Or and
                Groshev, Edward and
                Tamar, Aviv},
  title      = {Sub-Goal Trees -- a Framework for Goal-Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2002.12361},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.12361},
  eprinttype = {arXiv},
  eprint     = {2002.12361},
  timestamp  = {Tue, 05 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-12361.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2007-05614,
  author     = {Zur, Roi Bar and
                Eyal, Ittay and
                Tamar, Aviv},
  title      = {Efficient {MDP} Analysis for Selfish-Mining in Blockchains},
  journal    = {CoRR},
  volume     = {abs/2007.05614},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.05614},
  eprinttype = {arXiv},
  eprint     = {2007.05614},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-05614.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2008-02598,
  author     = {Dorfman, Ron and
                Tamar, Aviv},
  title      = {Offline Meta Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2008.02598},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.02598},
  eprinttype = {arXiv},
  eprint     = {2008.02598},
  timestamp  = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-02598.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces keep "2D" capitalised under styles that sentence-case titles.
@article{DBLP:journals/corr/abs-2009-09408,
  author     = {Geft, Tzvika and
                Tamar, Aviv and
                Goldberg, Ken and
                Halperin, Dan},
  title      = {Robust {2D} Assembly Sequencing via Geometric Planning with Learned Scores},
  journal    = {CoRR},
  volume     = {abs/2009.09408},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.09408},
  eprinttype = {arXiv},
  eprint     = {2009.09408},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-09408.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2010-03625,
  author     = {Rotman, Noga H. and
                Schapira, Michael and
                Tamar, Aviv},
  title      = {Online Safety Assurance for Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2010.03625},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.03625},
  eprinttype = {arXiv},
  eprint     = {2010.03625},
  timestamp  = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-03625.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces keep the model name's internal capitals under styles that sentence-case titles.
@article{DBLP:journals/corr/abs-2012-13253,
  author     = {Daniel, Tal and
                Tamar, Aviv},
  title      = {{Soft-IntroVAE}: Analyzing and Improving the Introspective Variational Autoencoder},
  journal    = {CoRR},
  volume     = {abs/2012.13253},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.13253},
  eprinttype = {arXiv},
  eprint     = {2012.13253},
  timestamp  = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-13253.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/amcc/ChapmanLTLSCFJP19,
  author     = {Chapman, Margaret P. and
                Lacotte, Jonathan and
                Tamar, Aviv and
                Lee, Donggun and
                Smith, Kevin M. and
                Cheng, Victoria and
                Fisac, Jaime F. and
                Jha, Susmit and
                Pavone, Marco and
                Tomlin, Claire J.},
  title      = {A Risk-Sensitive Finite-Time Reachability Approach for Safety of Stochastic Dynamic Systems},
  booktitle  = {2019 American Control Conference, {ACC} 2019, Philadelphia,
                PA, USA, July 10-12, 2019},
  pages      = {2958--2963},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.23919/ACC.2019.8815169},
  doi        = {10.23919/ACC.2019.8815169},
  timestamp  = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/amcc/ChapmanLTLSCFJP19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces keep "2D" capitalised under styles that sentence-case titles.
@inproceedings{DBLP:conf/case/GeftTGH19,
  author     = {Geft, Tzvika and
                Tamar, Aviv and
                Goldberg, Ken and
                Halperin, Dan},
  title      = {Robust {2D} Assembly Sequencing via Geometric Planning with Learned Scores},
  booktitle  = {15th {IEEE} International Conference on Automation Science and
                Engineering, {CASE} 2019, Vancouver, BC, Canada, August 22-26, 2019},
  pages      = {1603--1610},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/COASE.2019.8843109},
  doi        = {10.1109/COASE.2019.8843109},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/case/GeftTGH19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/corl/KrupnikMT19,
  author     = {Krupnik, Orr and
                Mordatch, Igor and
                Tamar, Aviv},
  editor     = {Kaelbling, Leslie Pack and
                Kragic, Danica and
                Sugiura, Komei},
  title      = {Multi-Agent Reinforcement Learning with Multi-Step Generative Models},
  booktitle  = {3rd Annual Conference on Robot Learning, CoRL 2019, Osaka,
                Japan, October 30 - November 1, 2019, Proceedings},
  series     = {Proceedings of Machine Learning Research},
  volume     = {100},
  pages      = {776--790},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v100/krupnik20a.html},
  timestamp  = {Mon, 25 May 2020 12:12:52 +0200},
  biburl     = {https://dblp.org/rec/conf/corl/KrupnikMT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iccv/WuWTRGT19,
  author     = {Wu, Yi and
                Wu, Yuxin and
                Tamar, Aviv and
                Russell, Stuart and
                Gkioxari, Georgia and
                Tian, Yuandong},
  title      = {Bayesian Relational Memory for Semantic Visual Navigation},
  booktitle  = {2019 {IEEE/CVF} International Conference on Computer Vision,
                {ICCV} 2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages      = {2769--2779},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICCV.2019.00286},
  doi        = {10.1109/ICCV.2019.00286},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iccv/WuWTRGT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces keep the proper noun "Bellman" capitalised under styles that sentence-case titles.
@inproceedings{DBLP:conf/icml/FreirichSMT19,
  author     = {Freirich, Dror and
                Shimkin, Tzahi and
                Meir, Ron and
                Tamar, Aviv},
  editor     = {Chaudhuri, Kamalika and
                Salakhutdinov, Ruslan},
  title      = {Distributional Multivariate Policy Evaluation and Exploration with the {Bellman} {GAN}},
  booktitle  = {Proceedings of the 36th International Conference on Machine
                Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {97},
  pages      = {1983--1992},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v97/freirich19a.html},
  timestamp  = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/FreirichSMT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/JayRGST19,
  author     = {Jay, Nathan and
                Rotman, Noga H. and
                Godfrey, Brighten and
                Schapira, Michael and
                Tamar, Aviv},
  editor     = {Chaudhuri, Kamalika and
                Salakhutdinov, Ruslan},
  title      = {A Deep Reinforcement Learning Perspective on Internet Congestion Control},
  booktitle  = {Proceedings of the 36th International Conference on Machine
                Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {97},
  pages      = {3050--3059},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v97/jay19a.html},
  timestamp  = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/JayRGST19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/LuoSWOATA19,
  author     = {Luo, Jianlan and
                Solowjow, Eugen and
                Wen, Chengtao and
                Ojea, Juan Aparicio and
                Agogino, Alice M. and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Reinforcement Learning on Variable Impedance Controller for High-Precision Robotic Assembly},
  booktitle  = {International Conference on Robotics and Automation, {ICRA}
                2019, Montreal, QC, Canada, May 20-24, 2019},
  pages      = {3080--3087},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICRA.2019.8793506},
  doi        = {10.1109/ICRA.2019.8793506},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/LuoSWOATA19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/RenLSO0TA19,
  author     = {Ren, Xinyi and
                Luo, Jianlan and
                Solowjow, Eugen and
                Ojea, Juan Aparicio and
                Gupta, Abhishek and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Domain Randomization for Active Pose Estimation},
  booktitle  = {International Conference on Robotics and Automation, {ICRA}
                2019, Montreal, QC, Canada, May 20-24, 2019},
  pages      = {7228--7234},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICRA.2019.8794126},
  doi        = {10.1109/ICRA.2019.8794126},
  timestamp  = {Tue, 13 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/RenLSO0TA19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/rss/JurgensonT19,
  author     = {Jurgenson, Tom and
                Tamar, Aviv},
  editor     = {Bicchi, Antonio and
                Kress{-}Gazit, Hadas and
                Hutchinson, Seth},
  title      = {Harnessing Reinforcement Learning for Neural Motion Planning},
  booktitle  = {Robotics: Science and Systems XV, University of Freiburg,
                Freiburg im Breisgau, Germany, June 22-26, 2019},
  year       = {2019},
  url        = {https://doi.org/10.15607/RSS.2019.XV.026},
  doi        = {10.15607/RSS.2019.XV.026},
  timestamp  = {Thu, 01 Apr 2021 15:25:13 +0200},
  biburl     = {https://dblp.org/rec/conf/rss/JurgensonT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/rss/WangKAT19,
  author     = {Wang, Angelina and
                Kurutach, Thanard and
                Abbeel, Pieter and
                Tamar, Aviv},
  editor     = {Bicchi, Antonio and
                Kress{-}Gazit, Hadas and
                Hutchinson, Seth},
  title      = {Learning Robotic Manipulation through Visual Planning and Acting},
  booktitle  = {Robotics: Science and Systems XV, University of Freiburg,
                Freiburg im Breisgau, Germany, June 22-26, 2019},
  year       = {2019},
  url        = {https://doi.org/10.15607/RSS.2019.XV.074},
  doi        = {10.15607/RSS.2019.XV.074},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/rss/WangKAT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1901-10251,
  author     = {Krupnik, Orr and
                Mordatch, Igor and
                Tamar, Aviv},
  title      = {Multi Agent Reinforcement Learning with Multi-Step Generative Models},
  journal    = {CoRR},
  volume     = {abs/1901.10251},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.10251},
  eprinttype = {arXiv},
  eprint     = {1901.10251},
  timestamp  = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-10251.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1902-11277,
  author     = {Chapman, Margaret P. and
                Lacotte, Jonathan and
                Tamar, Aviv and
                Lee, Donggun and
                Smith, Kevin M. and
                Cheng, Victoria and
                Fisac, Jaime F. and
                Jha, Susmit and
                Pavone, Marco and
                Tomlin, Claire J.},
  title      = {A Risk-Sensitive Finite-Time Reachability Approach for Safety of Stochastic Dynamic Systems},
  journal    = {CoRR},
  volume     = {abs/1902.11277},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.11277},
  eprinttype = {arXiv},
  eprint     = {1902.11277},
  timestamp  = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-11277.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1903-01066,
  author     = {Luo, Jianlan and
                Solowjow, Eugen and
                Wen, Chengtao and
                Ojea, Juan Aparicio and
                Agogino, Alice M. and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Reinforcement Learning on Variable Impedance Controller for High-Precision Robotic Assembly},
  journal    = {CoRR},
  volume     = {abs/1903.01066},
  year       = {2019},
  url        = {https://arxiv.org/abs/1903.01066},
  eprinttype = {arXiv},
  eprint     = {1903.01066},
  timestamp  = {Sat, 30 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1903-01066.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1903-03953,
  author     = {Ren, Xinyi and
                Luo, Jianlan and
                Solowjow, Eugen and
                Ojea, Juan Aparicio and
                Gupta, Abhishek and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Domain Randomization for Active Pose Estimation},
  journal    = {CoRR},
  volume     = {abs/1903.03953},
  year       = {2019},
  url        = {https://arxiv.org/abs/1903.03953},
  eprinttype = {arXiv},
  eprint     = {1903.03953},
  timestamp  = {Sun, 31 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1903-03953.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1905-04411,
  author     = {Wang, Angelina and
                Kurutach, Thanard and
                Liu, Kara and
                Abbeel, Pieter and
                Tamar, Aviv},
  title      = {Learning Robotic Manipulation through Visual Planning and Acting},
  journal    = {CoRR},
  volume     = {abs/1905.04411},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.04411},
  eprinttype = {arXiv},
  eprint     = {1905.04411},
  timestamp  = {Tue, 28 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-04411.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1906-00214,
  author     = {Jurgenson, Tom and
                Tamar, Aviv},
  title      = {Harnessing Reinforcement Learning for Neural Motion Planning},
  journal    = {CoRR},
  volume     = {abs/1906.00214},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.00214},
  eprinttype = {arXiv},
  eprint     = {1906.00214},
  timestamp  = {Thu, 13 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-00214.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% "--" typesets the dash in the title as an en dash instead of a spaced hyphen.
@article{DBLP:journals/corr/abs-1906-05329,
  author     = {Jurgenson, Tom and
                Groshev, Edward and
                Tamar, Aviv},
  title      = {Sub-Goal Trees -- a Framework for Goal-Directed Trajectory Prediction and Optimization},
  journal    = {CoRR},
  volume     = {abs/1906.05329},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.05329},
  eprinttype = {arXiv},
  eprint     = {1906.05329},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-05329.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1909-04306,
  author     = {Wu, Yi and
                Wu, Yuxin and
                Tamar, Aviv and
                Russell, Stuart and
                Gkioxari, Georgia and
                Tian, Yuandong},
  title      = {Bayesian Relational Memory for Semantic Visual Navigation},
  journal    = {CoRR},
  volume     = {abs/1909.04306},
  year       = {2019},
  url        = {https://arxiv.org/abs/1909.04306},
  eprinttype = {arXiv},
  eprint     = {1909.04306},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-04306.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1911-04971,
  author     = {Daniel, Tal and
                Kurutach, Thanard and
                Tamar, Aviv},
  title      = {Deep Variational Semi-Supervised Novelty Detection},
  journal    = {CoRR},
  volume     = {abs/1911.04971},
  year       = {2019},
  url        = {https://arxiv.org/abs/1911.04971},
  eprinttype = {arXiv},
  eprint     = {1911.04971},
  timestamp  = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-04971.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaiss/GroshevTGSA18,
  author     = {Groshev, Edward and
                Tamar, Aviv and
                Goldstein, Maxwell and
                Srivastava, Siddharth and
                Abbeel, Pieter},
  title      = {Learning Generalized Reactive Policies using Deep Neural Networks},
  booktitle  = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto,
                California, USA, March 26-28, 2018},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17533},
  timestamp  = {Tue, 08 Jan 2019 14:37:15 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/GroshevTGSA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aips/GroshevGTSA18,
  author     = {Groshev, Edward and
                Goldstein, Maxwell and
                Tamar, Aviv and
                Srivastava, Siddharth and
                Abbeel, Pieter},
  editor     = {de Weerdt, Mathijs and
                Koenig, Sven and
                R{\"{o}}ger, Gabriele and
                Spaan, Matthijs T. J.},
  title      = {Learning Generalized Reactive Policies Using Deep Neural Networks},
  booktitle  = {Proceedings of the Twenty-Eighth International Conference on
                Automated Planning and Scheduling, {ICAPS} 2018, Delft, The
                Netherlands, June 24-29, 2018},
  pages      = {408--416},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/ICAPS/ICAPS18/paper/view/17782},
  timestamp  = {Mon, 25 Jun 2018 13:32:06 +0200},
  biburl     = {https://dblp.org/rec/conf/aips/GroshevGTSA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/KurutachCDTA18,
  author     = {Kurutach, Thanard and
                Clavera, Ignasi and
                Duan, Yan and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Model-Ensemble Trust-Region Policy Optimization},
  booktitle  = {6th International Conference on Learning Representations,
                {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
                Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=SJJinbWRZ},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KurutachCDTA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/TamarRCVGKP18,
  author     = {Tamar, Aviv and
                Rohanimanesh, Khashayar and
                Chow, Yinlam and
                Vigorito, Chris and
                Goodrich, Ben and
                Kahane, Michael and
                Pridmore, Derik},
  title      = {Imitation Learning from Visual Data with Multiple Intentions},
  booktitle  = {6th International Conference on Learning Representations,
                {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
                Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Hk3ddfWRW},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/TamarRCVGKP18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/ThomasCTOA18,
  author     = {Thomas, Garrett and
                Chien, Melissa and
                Tamar, Aviv and
                Ojea, Juan Aparicio and
                Abbeel, Pieter},
  title      = {Learning Robotic Assembly from {CAD}},
  booktitle  = {2018 {IEEE} International Conference on Robotics and Automation,
                {ICRA} 2018, Brisbane, Australia, May 21-25, 2018},
  pages      = {1--9},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ICRA.2018.8460696},
  doi        = {10.1109/ICRA.2018.8460696},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/ThomasCTOA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces keep the method name's capitals under styles that sentence-case titles.
@inproceedings{DBLP:conf/nips/KurutachTYRA18,
  author     = {Kurutach, Thanard and
                Tamar, Aviv and
                Yang, Ge and
                Russell, Stuart J. and
                Abbeel, Pieter},
  editor     = {Bengio, Samy and
                Wallach, Hanna M. and
                Larochelle, Hugo and
                Grauman, Kristen and
                Cesa{-}Bianchi, Nicol{\`{o}} and
                Garnett, Roman},
  title      = {Learning Plannable Representations with {Causal InfoGAN}},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual
                Conference on Neural Information Processing Systems 2018,
                NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {8747--8758},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/08aac6ac98e59e523995c161e57875f5-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/KurutachTYRA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1802-10592,
  author     = {Kurutach, Thanard and
                Clavera, Ignasi and
                Duan, Yan and
                Tamar, Aviv and
                Abbeel, Pieter},
  title      = {Model-Ensemble Trust-Region Policy Optimization},
  journal    = {CoRR},
  volume     = {abs/1802.10592},
  year       = {2018},
  url        = {https://arxiv.org/abs/1802.10592},
  eprinttype = {arXiv},
  eprint     = {1802.10592},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-10592.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1803-07635,
  author     = {Thomas, Garrett and
                Chien, Melissa and
                Tamar, Aviv and
                Ojea, Juan Aparicio and
                Abbeel, Pieter},
  title      = {Learning Robotic Assembly from {CAD}},
  journal    = {CoRR},
  volume     = {abs/1803.07635},
  year       = {2018},
  url        = {https://arxiv.org/abs/1803.07635},
  eprinttype = {arXiv},
  eprint     = {1803.07635},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-07635.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1805-07805,
  author     = {Sarafian, Elad and
                Tamar, Aviv and
                Kraus, Sarit},
  title      = {Safe Policy Learning from Observations},
  journal    = {CoRR},
  volume     = {abs/1805.07805},
  year       = {2018},
  url        = {https://arxiv.org/abs/1805.07805},
  eprinttype = {arXiv},
  eprint     = {1805.07805},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-07805.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1807-09341,
  author       = {Kurutach, Thanard and
                  Tamar, Aviv and
                  Yang, Ge and
                  Russell, Stuart and
                  Abbeel, Pieter},
  title        = {Learning Plannable Representations with Causal {InfoGAN}},
  journal      = {CoRR},
  volume       = {abs/1807.09341},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.09341},
  eprinttype   = {arXiv},
  eprint       = {1807.09341},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-09341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-01960,
  author       = {Freirich, Dror and
                  Meir, Ron and
                  Tamar, Aviv},
  title        = {Distributional Multivariate Policy Evaluation and Exploration with
                  the {Bellman} {GAN}},
  journal      = {CoRR},
  volume       = {abs/1808.01960},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.01960},
  eprinttype   = {arXiv},
  eprint       = {1808.01960},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-01960.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-10842,
  author       = {Wu, Yi and
                  Wu, Yuxin and
                  Tamar, Aviv and
                  Russell, Stuart and
                  Gkioxari, Georgia and
                  Tian, Yuandong},
  title        = {Learning and Planning with a Semantic Model},
  journal      = {CoRR},
  volume       = {abs/1809.10842},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.10842},
  eprinttype   = {arXiv},
  eprint       = {1809.10842},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-10842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-03259,
  author       = {Jay, Nathan and
                  Rotman, Noga H. and
                  Godfrey, Philip Brighten and
                  Schapira, Michael and
                  Tamar, Aviv},
  title        = {Internet Congestion Control via Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1810.03259},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.03259},
  eprinttype   = {arXiv},
  eprint       = {1810.03259},
  timestamp    = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-03259.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tac/TamarCGM17,
  author       = {Tamar, Aviv and
                  Chow, Yinlam and
                  Ghavamzadeh, Mohammad and
                  Mannor, Shie},
  title        = {Sequential Decision Making With Coherent Risk},
  journal      = {{IEEE} Transactions on Automatic Control},
  volume       = {62},
  number       = {7},
  pages        = {3323--3338},
  year         = {2017},
  url          = {https://doi.org/10.1109/TAC.2016.2644871},
  doi          = {10.1109/TAC.2016.2644871},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/TamarCGM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hotnets/ValadarskySST17,
  author       = {Valadarsky, Asaf and
                  Schapira, Michael and
                  Shahaf, Dafna and
                  Tamar, Aviv},
  editor       = {Banerjee, Sujata and
                  Karp, Brad and
                  Walfish, Michael},
  title        = {Learning to Route},
  booktitle    = {Proceedings of the 16th {ACM} Workshop on Hot Topics in Networks,
                  Palo Alto, CA, USA, HotNets 2017, November 30 - December 01, 2017},
  pages        = {185--191},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3152434.3152441},
  doi          = {10.1145/3152434.3152441},
  timestamp    = {Tue, 06 Nov 2018 16:58:14 +0100},
  biburl       = {https://dblp.org/rec/conf/hotnets/ValadarskySST17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/AchiamHTA17,
  author       = {Achiam, Joshua and
                  Held, David and
                  Tamar, Aviv and
                  Abbeel, Pieter},
  editor       = {Precup, Doina and
                  Teh, Yee Whye},
  title        = {Constrained Policy Optimization},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {22--31},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/achiam17a.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/AchiamHTA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/TamarTZLA17,
  author       = {Tamar, Aviv and
                  Thomas, Garrett and
                  Zhang, Tianhao and
                  Levine, Sergey and
                  Abbeel, Pieter},
  title        = {Learning from the Hindsight Plan - Episodic {MPC} Improvement},
  booktitle    = {2017 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2017, Singapore, Singapore, May 29 - June 3, 2017},
  pages        = {336--343},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICRA.2017.7989043},
  doi          = {10.1109/ICRA.2017.7989043},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/TamarTZLA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TamarWTLA17,
  author       = {Tamar, Aviv and
                  Wu, Yi and
                  Thomas, Garrett and
                  Levine, Sergey and
                  Abbeel, Pieter},
  editor       = {Sierra, Carles},
  title        = {Value Iteration Networks},
  booktitle    = {Proceedings of the Twenty-Sixth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August
                  19-25, 2017},
  pages        = {4949--4953},
  publisher    = {ijcai.org},
  year         = {2017},
  url          = {https://doi.org/10.24963/ijcai.2017/700},
  doi          = {10.24963/IJCAI.2017/700},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/TamarWTLA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LevineZMTM17,
  author       = {Levine, Nir and
                  Zahavy, Tom and
                  Mankowitz, Daniel J. and
                  Tamar, Aviv and
                  Mannor, Shie},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Shallow Updates for Deep Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {3135--3145},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/393c55aea738548df743a186d15f3bef-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LevineZMTM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LoweWTHAM17,
  author       = {Lowe, Ryan and
                  Wu, Yi and
                  Tamar, Aviv and
                  Harb, Jean and
                  Abbeel, Pieter and
                  Mordatch, Igor},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Multi-Agent Actor-Critic for Mixed Cooperative-Competitive Environments},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {6379--6390},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/68a9750337a418a86fe06c1991a1d64c-Abstract.html},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LoweWTHAM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LevineZMTM17,
  author       = {Levine, Nir and
                  Zahavy, Tom and
                  Mankowitz, Daniel J. and
                  Tamar, Aviv and
                  Mannor, Shie},
  title        = {Shallow Updates for Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1705.07461},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.07461},
  eprinttype   = {arXiv},
  eprint       = {1705.07461},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LevineZMTM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AchiamHTA17,
  author       = {Achiam, Joshua and
                  Held, David and
                  Tamar, Aviv and
                  Abbeel, Pieter},
  title        = {Constrained Policy Optimization},
  journal      = {CoRR},
  volume       = {abs/1705.10528},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.10528},
  eprinttype   = {arXiv},
  eprint       = {1705.10528},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AchiamHTA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LoweWTHAM17,
  author       = {Lowe, Ryan and
                  Wu, Yi and
                  Tamar, Aviv and
                  Harb, Jean and
                  Abbeel, Pieter and
                  Mordatch, Igor},
  title        = {Multi-Agent Actor-Critic for Mixed Cooperative-Competitive Environments},
  journal      = {CoRR},
  volume       = {abs/1706.02275},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.02275},
  eprinttype   = {arXiv},
  eprint       = {1706.02275},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LoweWTHAM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-03074,
  author       = {Valadarsky, Asaf and
                  Schapira, Michael and
                  Shahaf, Dafna and
                  Tamar, Aviv},
  title        = {A Machine Learning Approach to Routing},
  journal      = {CoRR},
  volume       = {abs/1708.03074},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.03074},
  eprinttype   = {arXiv},
  eprint       = {1708.03074},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-03074.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-07280,
  author       = {Groshev, Edward and
                  Tamar, Aviv and
                  Srivastava, Siddharth and
                  Abbeel, Pieter},
  title        = {Learning Generalized Reactive Policies using Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1708.07280},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.07280},
  eprinttype   = {arXiv},
  eprint       = {1708.07280},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-07280.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-07832,
  author       = {Mankowitz, Daniel J. and
                  Tamar, Aviv and
                  Mannor, Shie},
  title        = {Situationally Aware Options},
  journal      = {CoRR},
  volume       = {abs/1711.07832},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.07832},
  eprinttype   = {arXiv},
  eprint       = {1711.07832},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-07832.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-08534,
  author       = {Wang, William and
                  Wang, Angelina and
                  Tamar, Aviv and
                  Chen, Xi and
                  Abbeel, Pieter},
  title        = {Safer Classification by Synthesis},
  journal      = {CoRR},
  volume       = {abs/1711.08534},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.08534},
  eprinttype   = {arXiv},
  eprint       = {1711.08534},
  timestamp    = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-08534.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TamarCM16,
  author       = {Tamar, Aviv and
                  Di Castro, Dotan and
                  Mannor, Shie},
  title        = {Learning the Variance of the Reward-To-Go},
  journal      = {Journal of Machine Learning Research},
  volume       = {17},
  pages        = {13:1--13:36},
  year         = {2016},
  url          = {http://jmlr.org/papers/v17/14-335.html},
  timestamp    = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/TamarCM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HallakTMM16,
  author       = {Hallak, Assaf and
                  Tamar, Aviv and
                  Munos, R{\'{e}}mi and
                  Mannor, Shie},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {Generalized Emphatic Temporal Difference Learning: Bias-Variance Analysis},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {1631--1637},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.10227},
  doi          = {10.1609/AAAI.V30I1.10227},
  timestamp    = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HallakTMM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/TamarLAWT16,
  author       = {Tamar, Aviv and
                  Levine, Sergey and
                  Abbeel, Pieter and
                  Wu, Yi and
                  Thomas, Garrett},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Value Iteration Networks},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {2146--2154},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/c21002f464c5fc5bee3b98ced83963b8-Abstract.html},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/TamarLAWT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarLA16,
  author       = {Tamar, Aviv and
                  Levine, Sergey and
                  Abbeel, Pieter},
  title        = {Value Iteration Networks},
  journal      = {CoRR},
  volume       = {abs/1602.02867},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.02867},
  eprinttype   = {arXiv},
  eprint       = {1602.02867},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TamarLA16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GhavamzadehMPT16,
  author       = {Ghavamzadeh, Mohammad and
                  Mannor, Shie and
                  Pineau, Joelle and
                  Tamar, Aviv},
  title        = {{Bayesian} Reinforcement Learning: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/1609.04436},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.04436},
  eprinttype   = {arXiv},
  eprint       = {1609.04436},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GhavamzadehMPT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarTZLA16,
  author       = {Tamar, Aviv and
                  Thomas, Garrett and
                  Zhang, Tianhao and
                  Levine, Sergey and
                  Abbeel, Pieter},
  title        = {Learning from the Hindsight Plan - Episodic {MPC} Improvement},
  journal      = {CoRR},
  volume       = {abs/1609.09001},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.09001},
  eprinttype   = {arXiv},
  eprint       = {1609.09001},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/TamarTZLA16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MankowitzTM16,
  author       = {Mankowitz, Daniel J. and
                  Tamar, Aviv and
                  Mannor, Shie},
  title        = {Situational Awareness by Risk-Conscious Skills},
  journal      = {CoRR},
  volume       = {abs/1610.02847},
  year         = {2016},
  url          = {http://arxiv.org/abs/1610.02847},
  eprinttype   = {arXiv},
  eprint       = {1610.02847},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MankowitzTM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ftml/GhavamzadehMPT15,
  author       = {Ghavamzadeh, Mohammad and
                  Mannor, Shie and
                  Pineau, Joelle and
                  Tamar, Aviv},
  title        = {{Bayesian} Reinforcement Learning: {A} Survey},
  journal      = {Foundations and Trends in Machine Learning},
  volume       = {8},
  number       = {5--6},
  pages        = {359--483},
  year         = {2015},
  url          = {https://doi.org/10.1561/2200000049},
  doi          = {10.1561/2200000049},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ftml/GhavamzadehMPT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TamarGM15,
  author       = {Tamar, Aviv and
                  Glassner, Yonatan and
                  Mannor, Shie},
  editor       = {Bonet, Blai and
                  Koenig, Sven},
  title        = {Optimizing the {CVaR} via Sampling},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {2993--2999},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9561},
  doi          = {10.1609/AAAI.V29I1.9561},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TamarGM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/TamarCGM15,
  author       = {Tamar, Aviv and
                  Chow, Yinlam and
                  Ghavamzadeh, Mohammad and
                  Mannor, Shie},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Policy Gradient for Coherent Risk Measures},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {1468--1476},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/024d7f84fff11dd7e8d9c510137a2381-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/TamarCGM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChowTMP15,
  author       = {Chow, Yinlam and
                  Tamar, Aviv and
                  Mannor, Shie and
                  Pavone, Marco},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Risk-Sensitive and Robust Decision-Making: a {CVaR} Optimization Approach},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {1522--1530},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/64223ccf70bbb65a3a4aceac37e21016-Abstract.html},
  timestamp    = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChowTMP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarCGM15,
  author       = {Tamar, Aviv and
                  Chow, Yinlam and
                  Ghavamzadeh, Mohammad and
                  Mannor, Shie},
  title        = {Policy Gradient for Coherent Risk Measures},
  journal      = {CoRR},
  volume       = {abs/1502.03919},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.03919},
  eprinttype   = {arXiv},
  eprint       = {1502.03919},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TamarCGM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChowTMP15,
  author       = {Chow, Yinlam and
                  Tamar, Aviv and
                  Mannor, Shie and
                  Pavone, Marco},
  title        = {Risk-Sensitive and Robust Decision-Making: a {CVaR} Optimization Approach},
  journal      = {CoRR},
  volume       = {abs/1506.02188},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.02188},
  eprinttype   = {arXiv},
  eprint       = {1506.02188},
  timestamp    = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/ChowTMP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HallakTM15,
  author       = {Hallak, Assaf and
                  Tamar, Aviv and
                  Mannor, Shie},
  title        = {Emphatic {TD} {Bellman} Operator is a Contraction},
  journal      = {CoRR},
  volume       = {abs/1508.03411},
  year         = {2015},
  url          = {http://arxiv.org/abs/1508.03411},
  eprinttype   = {arXiv},
  eprint       = {1508.03411},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HallakTM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HallakTMM15,
  author       = {Hallak, Assaf and
                  Tamar, Aviv and
                  Munos, R{\'{e}}mi and
                  Mannor, Shie},
  title        = {Generalized Emphatic Temporal Difference Learning: Bias-Variance Analysis},
  journal      = {CoRR},
  volume       = {abs/1509.05172},
  year         = {2015},
  url          = {http://arxiv.org/abs/1509.05172},
  eprinttype   = {arXiv},
  eprint       = {1509.05172},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HallakTMM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/TamarMX14,
  author       = {Tamar, Aviv and
                  Mannor, Shie and
                  Xu, Huan},
  title        = {Scaling Up Robust {MDPs} using Function Approximation},
  booktitle    = {Proceedings of the 31st International Conference on Machine Learning,
                  {ICML} 2014, Beijing, China, 21-26 June 2014},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {32},
  pages        = {181--189},
  publisher    = {JMLR.org},
  year         = {2014},
  url          = {http://proceedings.mlr.press/v32/tamar14.html},
  timestamp    = {Tue, 12 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/TamarMX14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarGM14,
  author       = {Tamar, Aviv and
                  Glassner, Yonatan and
                  Mannor, Shie},
  title        = {Policy Gradients Beyond Expectations: Conditional Value-at-Risk},
  journal      = {CoRR},
  volume       = {abs/1404.3862},
  year         = {2014},
  url          = {http://arxiv.org/abs/1404.3862},
  eprinttype   = {arXiv},
  eprint       = {1404.3862},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TamarGM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarTMA14,
  author       = {Tamar, Aviv and
                  Toulis, Panos and
                  Mannor, Shie and
                  Airoldi, Edoardo M.},
  title        = {Implicit Temporal Differences},
  journal      = {CoRR},
  volume       = {abs/1412.6734},
  year         = {2014},
  url          = {http://arxiv.org/abs/1412.6734},
  eprinttype   = {arXiv},
  eprint       = {1412.6734},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TamarTMA14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/TamarCM13,
  author       = {Tamar, Aviv and
                  Di Castro, Dotan and
                  Mannor, Shie},
  title        = {Temporal Difference Methods for the Variance of the Reward To Go},
  booktitle    = {Proceedings of the 30th International Conference on Machine Learning,
                  {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {28},
  pages        = {495--503},
  publisher    = {JMLR.org},
  year         = {2013},
  url          = {http://proceedings.mlr.press/v28/tamar13.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TamarCM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1301-0104,
  author       = {Tamar, Aviv and
                  Di Castro, Dotan and
                  Mannor, Shie},
  title        = {Policy Evaluation with Variance Related Risk Criteria in {Markov} Decision
                  Processes},
  journal      = {CoRR},
  volume       = {abs/1301.0104},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.0104},
  eprinttype   = {arXiv},
  eprint       = {1301.0104},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-0104.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarXM13,
  author       = {Tamar, Aviv and
                  Xu, Huan and
                  Mannor, Shie},
  title        = {Scaling Up Robust {MDPs} by Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1306.6189},
  year         = {2013},
  url          = {http://arxiv.org/abs/1306.6189},
  eprinttype   = {arXiv},
  eprint       = {1306.6189},
  timestamp    = {Tue, 12 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/TamarXM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TamarM13,
  author       = {Tamar, Aviv and
                  Mannor, Shie},
  title        = {Variance Adjusted Actor Critic Algorithms},
  journal      = {CoRR},
  volume       = {abs/1310.3697},
  year         = {2013},
  url          = {http://arxiv.org/abs/1310.3697},
  eprinttype   = {arXiv},
  eprint       = {1310.3697},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TamarM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TamarCM12,
  author       = {Tamar, Aviv and
                  Di Castro, Dotan and
                  Meir, Ron},
  title        = {Integrating a Partial Model into Model Free Reinforcement Learning},
  journal      = {Journal of Machine Learning Research},
  volume       = {13},
  pages        = {1927--1966},
  year         = {2012},
  url          = {https://dl.acm.org/doi/10.5555/2503308.2343705},
  doi          = {10.5555/2503308.2343705},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/TamarCM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/CastroTM12,
  author       = {Di Castro, Dotan and
                  Tamar, Aviv and
                  Mannor, Shie},
  title        = {Policy Gradients with Variance Related Risk Criteria},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/489.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/CastroTM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/TamarCM11,
  author       = {Tamar, Aviv and
                  Di Castro, Dotan and
                  Meir, Ron},
  editor       = {Getoor, Lise and
                  Scheffer, Tobias},
  title        = {Integrating Partial Model Knowledge in Model Free {RL} Algorithms},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {305--312},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/222_icmlpaper.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TamarCM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics