% BibTeX records: Shayegan Omidshafiei
%
% (Exported from dblp via "download as .bib file".)

% Journal article (IEEE Control Systems Letters, vol. 8, 2024).
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2403-03314.
% The journal name is stored in full; abbreviation is left to the style.
@article{DBLP:journals/csysl/DongOE24,
  author     = {Dong, Zihao and
                Omidshafiei, Shayegan and
                Everett, Michael},
  title      = {Collision Avoidance Verification of Multiagent Systems With Learned
                Policies},
  journal    = {{IEEE} Control Systems Letters},
  volume     = {8},
  pages      = {652--657},
  year       = {2024},
  url        = {https://doi.org/10.1109/LCSYS.2024.3400190},
  doi        = {10.1109/LCSYS.2024.3400190},
  timestamp  = {Tue, 18 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/csysl/DongOE24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2024 conference paper (published via OpenReview.net).
% The system name in the title is brace-protected so sentence-casing styles
% keep its mixed capitalisation.
@inproceedings{DBLP:conf/icml/WuCKRSSDTOCCJH24,
  author     = {Wu, Yusong and
                Cooijmans, Tim and
                Kastner, Kyle and
                Roberts, Adam and
                Simon, Ian and
                Scarlatos, Alexander and
                Donahue, Chris and
                Tarakajian, Cassie and
                Omidshafiei, Shayegan and
                Courville, Aaron C. and
                Castro, Pablo Samuel and
                Jaques, Natasha and
                Huang, Cheng{-}Zhi Anna},
  title      = {Adaptive Accompaniment with {ReaLchords}},
  booktitle  = {Forty-first International Conference on Machine Learning, {ICML} 2024,
                Vienna, Austria, July 21-27, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=mUVydzrkgz},
  timestamp  = {Mon, 02 Sep 2024 16:45:29 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/WuCKRSSDTOCCJH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2403.03314.
% A journal record with the same authors and title is DBLP:journals/csysl/DongOE24.
@article{DBLP:journals/corr/abs-2403-03314,
  author     = {Dong, Zihao and
                Omidshafiei, Shayegan and
                Everett, Michael},
  title      = {Collision Avoidance Verification of Multiagent Systems with Learned
                Policies},
  journal    = {CoRR},
  volume     = {abs/2403.03314},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.03314},
  doi        = {10.48550/ARXIV.2403.03314},
  eprinttype = {arXiv},
  eprint     = {2403.03314},
  timestamp  = {Wed, 03 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-03314.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2406.16807.
@article{DBLP:journals/corr/abs-2406-16807,
  author     = {Collins, Katherine M. and
                Kim, Najoung and
                Bitton, Yonatan and
                Rieser, Verena and
                Omidshafiei, Shayegan and
                Hu, Yushi and
                Chen, Sherol and
                Dutta, Senjuti and
                Chang, Minsuk and
                Lee, Kimin and
                Liang, Youwei and
                Evans, Georgina and
                Singla, Sahil and
                Li, Gang and
                Weller, Adrian and
                He, Junfeng and
                Ramachandran, Deepak and
                Dvijotham, Krishnamurthy Dj},
  title      = {Beyond Thumbs Up/Down: Untangling Challenges of Fine-Grained Feedback
                for Text-to-Image Generation},
  journal    = {CoRR},
  volume     = {abs/2406.16807},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2406.16807},
  doi        = {10.48550/ARXIV.2406.16807},
  eprinttype = {arXiv},
  eprint     = {2406.16807},
  timestamp  = {Mon, 22 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-16807.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (IEEE Control Systems Letters, vol. 7, 2023).
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2212-04646.
% The journal name is stored in full. The colon after the acronym sits outside
% the protecting braces so styles can recognise the subtitle boundary.
@article{DBLP:journals/csysl/EverettBO23,
  author     = {Everett, Michael and
                Bunel, Rudy and
                Omidshafiei, Shayegan},
  title      = {{DRIP}: Domain Refinement Iteration With Polytopes for Backward Reachability
                Analysis of Neural Feedback Loops},
  journal    = {{IEEE} Control Systems Letters},
  volume     = {7},
  pages      = {1622--1627},
  year       = {2023},
  url        = {https://doi.org/10.1109/LCSYS.2023.3260731},
  doi        = {10.1109/LCSYS.2023.3260731},
  timestamp  = {Fri, 02 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/csysl/EverettBO23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2310.04623.
@article{DBLP:journals/corr/abs-2310-04623,
  author     = {Ueshima, Atsushi and
                Omidshafiei, Shayegan and
                Shirado, Hirokazu},
  title      = {Deconstructing Cooperation and Ostracism via Multi-Agent Reinforcement
                Learning},
  journal    = {CoRR},
  volume     = {abs/2310.04623},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.04623},
  doi        = {10.48550/ARXIV.2310.04623},
  eprinttype = {arXiv},
  eprint     = {2310.04623},
  timestamp  = {Fri, 20 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-04623.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Journal of Artificial Intelligence Research, vol. 74, 2022).
% A CoRR record with the same authors is DBLP:journals/corr/abs-2106-14668.
% The journal name is stored in full; the Greek-letter name in the title is
% brace-protected against sentence-casing.
@article{DBLP:journals/jair/PiliourasROEHCT22,
  author     = {Piliouras, Georgios and
                Rowland, Mark and
                Omidshafiei, Shayegan and
                Elie, Romuald and
                Hennes, Daniel and
                Connor, Jerome T. and
                Tuyls, Karl},
  title      = {Evolutionary Dynamics and {Phi}-Regret Minimization in Games},
  journal    = {Journal of Artificial Intelligence Research},
  volume     = {74},
  pages      = {1125--1158},
  year       = {2022},
  url        = {https://doi.org/10.1613/jair.1.13187},
  doi        = {10.1613/JAIR.1.13187},
  timestamp  = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jair/PiliourasROEHCT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Science Robotics, vol. 7, no. 69, 2022).
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2105-12196.
% The journal name is stored in full. The title is stored in Title Case, as in
% the CoRR record, because styles can down-case but cannot restore capitals.
@article{DBLP:journals/scirobotics/LiuLWMEHCTOASHM22,
  author     = {Liu, Siqi and
                Lever, Guy and
                Wang, Zhe and
                Merel, Josh and
                Eslami, S. M. Ali and
                Hennes, Daniel and
                Czarnecki, Wojciech M. and
                Tassa, Yuval and
                Omidshafiei, Shayegan and
                Abdolmaleki, Abbas and
                Siegel, Noah Y. and
                Hasenclever, Leonard and
                Marris, Luke and
                Tunyasuvunakool, Saran and
                Song, H. Francis and
                Wulfmeier, Markus and
                Muller, Paul and
                Haarnoja, Tuomas and
                Tracey, Brendan D. and
                Tuyls, Karl and
                Graepel, Thore and
                Heess, Nicolas},
  title      = {From Motor Control to Team Play in Simulated Humanoid Football},
  journal    = {Science Robotics},
  volume     = {7},
  number     = {69},
  year       = {2022},
  url        = {https://doi.org/10.1126/scirobotics.abo0235},
  doi        = {10.1126/SCIROBOTICS.ABO0235},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/scirobotics/LiuLWMEHCTOASHM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 conference paper.
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2206-09046.
% The url field holds the raw URL (underscore not LaTeX-escaped), and editor
% given names are written in full rather than as initials.
@inproceedings{DBLP:conf/nips/OmidshafieiKADK22,
  author     = {Omidshafiei, Shayegan and
                Kapishnikov, Andrei and
                Assogba, Yannick and
                Dixon, Lucas and
                Kim, Been},
  editor     = {Koyejo, Sanmi and
                Mohamed, Shakir and
                Agarwal, Alekh and
                Belgrave, Danielle and
                Cho, Kyunghyun and
                Oh, Alice},
  title      = {Beyond Rewards: a Hierarchical Perspective on Offline Multiagent Behavioral
                Analysis},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference
                on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper_files/paper/2022/hash/1663fba7b56da1e96bed6e30546a07b0-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/OmidshafieiKADK22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2206.09046.
% A conference record with the same authors and title is DBLP:conf/nips/OmidshafieiKADK22.
@article{DBLP:journals/corr/abs-2206-09046,
  author     = {Omidshafiei, Shayegan and
                Kapishnikov, Andrei and
                Assogba, Yannick and
                Dixon, Lucas and
                Kim, Been},
  title      = {Beyond Rewards: a Hierarchical Perspective on Offline Multiagent Behavioral
                Analysis},
  journal    = {CoRR},
  volume     = {abs/2206.09046},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.09046},
  doi        = {10.48550/ARXIV.2206.09046},
  eprinttype = {arXiv},
  eprint     = {2206.09046},
  timestamp  = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-09046.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2206.15378.
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser. The game name in the title is brace-protected
% against sentence-casing.
@article{DBLP:journals/corr/abs-2206-15378,
  author     = {P{\'{e}}rolat, Julien and
                De Vylder, Bart and
                Hennes, Daniel and
                Tarassov, Eugene and
                Strub, Florian and
                de Boer, Vincent and
                Muller, Paul and
                Connor, Jerome T. and
                Burch, Neil and
                Anthony, Thomas W. and
                McAleer, Stephen and
                Elie, Romuald and
                Cen, Sarah H. and
                Wang, Zhe and
                Gruslys, Audrunas and
                Malysheva, Aleksandra and
                Khan, Mina and
                Ozair, Sherjil and
                Timbers, Finbarr and
                Pohlen, Toby and
                Eccles, Tom and
                Rowland, Mark and
                Lanctot, Marc and
                Lespiau, Jean{-}Baptiste and
                Piot, Bilal and
                Omidshafiei, Shayegan and
                Lockhart, Edward and
                Sifre, Laurent and
                Beauguerlange, Nathalie and
                Munos, R{\'{e}}mi and
                Silver, David and
                Singh, Satinder and
                Hassabis, Demis and
                Tuyls, Karl},
  title      = {Mastering the Game of {Stratego} with Model-Free Multiagent Reinforcement
                Learning},
  journal    = {CoRR},
  volume     = {abs/2206.15378},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.15378},
  doi        = {10.48550/ARXIV.2206.15378},
  eprinttype = {arXiv},
  eprint     = {2206.15378},
  timestamp  = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-15378.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2210.02205.
% The variable N in the title is brace-protected so sentence-casing styles do
% not down-case it.
@article{DBLP:journals/corr/abs-2210-02205,
  author     = {Marris, Luke and
                Lanctot, Marc and
                Gemp, Ian and
                Omidshafiei, Shayegan and
                McAleer, Stephen and
                Connor, Jerome T. and
                Tuyls, Karl and
                Graepel, Thore},
  title      = {Game Theoretic Rating in {N}-player general-sum games with Equilibria},
  journal    = {CoRR},
  volume     = {abs/2210.02205},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.02205},
  doi        = {10.48550/ARXIV.2210.02205},
  eprinttype = {arXiv},
  eprint     = {2210.02205},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-02205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2211.16385.
@article{DBLP:journals/corr/abs-2211-16385,
  author     = {Krishnan, Srivatsan and
                Jaques, Natasha and
                Omidshafiei, Shayegan and
                Zhang, Dan and
                Gur, Izzeddin and
                Reddi, Vijay Janapa and
                Faust, Aleksandra},
  title      = {Multi-Agent Reinforcement Learning for Microprocessor Design Space
                Exploration},
  journal    = {CoRR},
  volume     = {abs/2211.16385},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.16385},
  doi        = {10.48550/ARXIV.2211.16385},
  eprinttype = {arXiv},
  eprint     = {2211.16385},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-16385.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2212.04646.
% A journal record with the same authors and title is DBLP:journals/csysl/EverettBO23.
% The colon after the acronym sits outside the protecting braces so styles can
% recognise the subtitle boundary.
@article{DBLP:journals/corr/abs-2212-04646,
  author     = {Everett, Michael and
                Bunel, Rudy and
                Omidshafiei, Shayegan},
  title      = {{DRIP}: Domain Refinement Iteration with Polytopes for Backward Reachability
                Analysis of Neural Feedback Loops},
  journal    = {CoRR},
  volume     = {abs/2212.04646},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.04646},
  doi        = {10.48550/ARXIV.2212.04646},
  eprinttype = {arXiv},
  eprint     = {2212.04646},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-04646.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Journal of Artificial Intelligence Research, vol. 71, 2021).
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2011-09192.
% The journal name is stored in full. Names use the "Last, First" form so the
% two-word surname "De Vylder" is not split by BibTeX's name parser.
@article{DBLP:journals/jair/TuylsOMWCHGSWSL21,
  author     = {Tuyls, Karl and
                Omidshafiei, Shayegan and
                Muller, Paul and
                Wang, Zhe and
                Connor, Jerome T. and
                Hennes, Daniel and
                Graham, Ian and
                Spearman, William and
                Waskett, Tim and
                Steele, Dafydd and
                Luc, Pauline and
                Recasens, Adri{\`{a}} and
                Galashov, Alexandre and
                Thornton, Gregory and
                Elie, Romuald and
                Sprechmann, Pablo and
                Moreno, Pol and
                Cao, Kris and
                Garnelo, Marta and
                Dutta, Praneet and
                Valko, Michal and
                Heess, Nicolas and
                Bridgland, Alex and
                P{\'{e}}rolat, Julien and
                De Vylder, Bart and
                Eslami, S. M. Ali and
                Rowland, Mark and
                Jaegle, Andrew and
                Munos, R{\'{e}}mi and
                Back, Trevor and
                Ahamed, Razia and
                Bouton, Simon and
                Beauguerlange, Nathalie and
                Broshear, Jackson and
                Graepel, Thore and
                Hassabis, Demis},
  title      = {Game Plan: What {AI} can do for Football, and What Football can do
                for {AI}},
  journal    = {Journal of Artificial Intelligence Research},
  volume     = {71},
  pages      = {41--88},
  year       = {2021},
  url        = {https://doi.org/10.1613/jair.1.12505},
  doi        = {10.1613/JAIR.1.12505},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jair/TuylsOMWCHGSWSL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2021 conference paper (PMLR vol. 139).
% A CoRR record with the same authors and title is DBLP:journals/corr/abs-2002-08456.
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser. The proper noun in the title is brace-protected
% against sentence-casing.
@inproceedings{DBLP:conf/icml/PerolatMLOROBAB21,
  author     = {P{\'{e}}rolat, Julien and
                Munos, R{\'{e}}mi and
                Lespiau, Jean{-}Baptiste and
                Omidshafiei, Shayegan and
                Rowland, Mark and
                Ortega, Pedro A. and
                Burch, Neil and
                Anthony, Thomas W. and
                Balduzzi, David and
                De Vylder, Bart and
                Piliouras, Georgios and
                Lanctot, Marc and
                Tuyls, Karl},
  editor     = {Meila, Marina and
                Zhang, Tong},
  title      = {From {Poincar{\'{e}}} Recurrence to Convergence in Imperfect Information
                Games: Finding Equilibrium via Regularization},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning,
                {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {8525--8535},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/perolat21a.html},
  timestamp  = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/PerolatMLOROBAB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2105.12196.
% A journal record with the same authors and title is
% DBLP:journals/scirobotics/LiuLWMEHCTOASHM22.
@article{DBLP:journals/corr/abs-2105-12196,
  author     = {Liu, Siqi and
                Lever, Guy and
                Wang, Zhe and
                Merel, Josh and
                Eslami, S. M. Ali and
                Hennes, Daniel and
                Czarnecki, Wojciech M. and
                Tassa, Yuval and
                Omidshafiei, Shayegan and
                Abdolmaleki, Abbas and
                Siegel, Noah Y. and
                Hasenclever, Leonard and
                Marris, Luke and
                Tunyasuvunakool, Saran and
                Song, H. Francis and
                Wulfmeier, Markus and
                Muller, Paul and
                Haarnoja, Tuomas and
                Tracey, Brendan D. and
                Tuyls, Karl and
                Graepel, Thore and
                Heess, Nicolas},
  title      = {From Motor Control to Team Play in Simulated Humanoid Football},
  journal    = {CoRR},
  volume     = {abs/2105.12196},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.12196},
  eprinttype = {arXiv},
  eprint     = {2105.12196},
  timestamp  = {Thu, 11 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-12196.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2106.04219.
@article{DBLP:journals/corr/abs-2106-04219,
  author     = {Omidshafiei, Shayegan and
                Hennes, Daniel and
                Garnelo, Marta and
                Tarassov, Eugene and
                Wang, Zhe and
                Elie, Romuald and
                Connor, Jerome T. and
                Muller, Paul and
                Graham, Ian and
                Spearman, William and
                Tuyls, Karl},
  title      = {Time-series Imputation of Temporally-occluded Multiagent Trajectories},
  journal    = {CoRR},
  volume     = {abs/2106.04219},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.04219},
  eprinttype = {arXiv},
  eprint     = {2106.04219},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04219.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2106.14668.
% A journal record with the same authors is DBLP:journals/jair/PiliourasROEHCT22.
@article{DBLP:journals/corr/abs-2106-14668,
  author     = {Piliouras, Georgios and
                Rowland, Mark and
                Omidshafiei, Shayegan and
                Elie, Romuald and
                Hennes, Daniel and
                Connor, Jerome T. and
                Tuyls, Karl},
  title      = {Evolutionary Dynamics and {\(\Phi\)}-Regret Minimization in Games},
  journal    = {CoRR},
  volume     = {abs/2106.14668},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.14668},
  eprinttype = {arXiv},
  eprint     = {2106.14668},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-14668.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Autonomous Agents and Multi-Agent Systems, vol. 34, no. 1, 2020).
% The journal name is stored in full; the proper noun "Atari" in the title is
% brace-protected against sentence-casing.
@article{DBLP:journals/aamas/KimOPH20,
  author     = {Kim, Dong{-}Ki and
                Omidshafiei, Shayegan and
                Pazis, Jason and
                How, Jonathan P.},
  title      = {Crossmodal attentive skill learner: learning in {Atari} and beyond with
                audio-video inputs},
  journal    = {Autonomous Agents and Multi-Agent Systems},
  volume     = {34},
  number     = {1},
  pages      = {16},
  year       = {2020},
  url        = {https://doi.org/10.1007/s10458-019-09439-5},
  doi        = {10.1007/S10458-019-09439-5},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aamas/KimOPH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% AAMAS 2020 conference paper.
% Names use the "Last, First" form so the multi-word editor surname
% "El Fallah Seghrouchni" is not split by BibTeX's name parser.
@inproceedings{DBLP:conf/atal/HennesMOMPLGLPD20,
  author     = {Hennes, Daniel and
                Morrill, Dustin and
                Omidshafiei, Shayegan and
                Munos, R{\'{e}}mi and
                P{\'{e}}rolat, Julien and
                Lanctot, Marc and
                Gruslys, Audrunas and
                Lespiau, Jean{-}Baptiste and
                Parmas, Paavo and
                Du{\'{e}}{\~{n}}ez{-}Guzm{\'{a}}n, Edgar A. and
                Tuyls, Karl},
  editor     = {El Fallah Seghrouchni, Amal and
                Sukthankar, Gita and
                An, Bo and
                Yorke{-}Smith, Neil},
  title      = {Neural Replicator Dynamics: Multiagent Learning via Hedging Policy
                Gradients},
  booktitle  = {Proceedings of the 19th International Conference on Autonomous Agents
                and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13,
                2020},
  pages      = {492--501},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems},
  year       = {2020},
  url        = {https://dl.acm.org/doi/10.5555/3398761.3398822},
  doi        = {10.5555/3398761.3398822},
  timestamp  = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/HennesMOMPLGLPD20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% AAMAS 2020 conference paper.
% Names use the "Last, First" form so the multi-word editor surname
% "El Fallah Seghrouchni" is not split by BibTeX's name parser.
@inproceedings{DBLP:conf/atal/Kim0OLRHTMCH20,
  author     = {Kim, Dong{-}Ki and
                Liu, Miao and
                Omidshafiei, Shayegan and
                Lopez{-}Cot, Sebastian and
                Riemer, Matthew and
                Habibi, Golnaz and
                Tesauro, Gerald and
                Mourad, Sami and
                Campbell, Murray and
                How, Jonathan P.},
  editor     = {El Fallah Seghrouchni, Amal and
                Sukthankar, Gita and
                An, Bo and
                Yorke{-}Smith, Neil},
  title      = {Learning Hierarchical Teaching Policies for Cooperative Agents},
  booktitle  = {Proceedings of the 19th International Conference on Autonomous Agents
                and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13,
                2020},
  pages      = {620--628},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems},
  year       = {2020},
  url        = {https://dl.acm.org/doi/10.5555/3398761.3398836},
  doi        = {10.5555/3398761.3398836},
  timestamp  = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/Kim0OLRHTMCH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2020 conference paper (published via OpenReview.net).
@inproceedings{DBLP:conf/iclr/MullerORTPLHMLH20,
  author     = {Muller, Paul and
                Omidshafiei, Shayegan and
                Rowland, Mark and
                Tuyls, Karl and
                P{\'{e}}rolat, Julien and
                Liu, Siqi and
                Hennes, Daniel and
                Marris, Luke and
                Lanctot, Marc and
                Hughes, Edward and
                Wang, Zhe and
                Lever, Guy and
                Heess, Nicolas and
                Graepel, Thore and
                Munos, R{\'{e}}mi},
  title      = {A Generalized Training Approach for Multiagent Learning},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=Bkl5kxrKDr},
  timestamp  = {Thu, 11 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/MullerORTPLHMLH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2020 conference paper (PMLR vol. 119).
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser. The proper noun "Nash" in the title is
% brace-protected against sentence-casing.
@inproceedings{DBLP:conf/icml/MunosPLRVLTHOGA20,
  author     = {Munos, R{\'{e}}mi and
                P{\'{e}}rolat, Julien and
                Lespiau, Jean{-}Baptiste and
                Rowland, Mark and
                De Vylder, Bart and
                Lanctot, Marc and
                Timbers, Finbarr and
                Hennes, Daniel and
                Omidshafiei, Shayegan and
                Gruslys, Audrunas and
                Azar, Mohammad Gheshlaghi and
                Lockhart, Edward and
                Tuyls, Karl},
  title      = {Fast computation of {Nash} Equilibria in Imperfect Information Games},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {7119--7129},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/munos20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/MunosPLRVLTHOGA20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2020 conference paper.
% A CoRR record with the same title is DBLP:journals/corr/abs-2004-09468.
@inproceedings{DBLP:conf/nips/CzarneckiGTTOBJ20,
  author     = {Czarnecki, Wojciech M. and
                Gidel, Gauthier and
                Tracey, Brendan D. and
                Tuyls, Karl and
                Omidshafiei, Shayegan and
                Balduzzi, David and
                Jaderberg, Max},
  editor     = {Larochelle, Hugo and
                Ranzato, Marc'Aurelio and
                Hadsell, Raia and
                Balcan, Maria{-}Florina and
                Lin, Hsuan{-}Tien},
  title      = {Real World Games Look Like Spinning Tops},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference
                on Neural Information Processing Systems 2020, NeurIPS 2020, December
                6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/ca172e964907a97d5ebd876bfdd4adbd-Abstract.html},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/CzarneckiGTTOBJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2002.08456.
% A conference record with the same authors and title is
% DBLP:conf/icml/PerolatMLOROBAB21.
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser. The proper noun in the title is brace-protected
% against sentence-casing.
@article{DBLP:journals/corr/abs-2002-08456,
  author     = {P{\'{e}}rolat, Julien and
                Munos, R{\'{e}}mi and
                Lespiau, Jean{-}Baptiste and
                Omidshafiei, Shayegan and
                Rowland, Mark and
                Ortega, Pedro A. and
                Burch, Neil and
                Anthony, Thomas W. and
                Balduzzi, David and
                De Vylder, Bart and
                Piliouras, Georgios and
                Lanctot, Marc and
                Tuyls, Karl},
  title      = {From {Poincar{\'{e}}} Recurrence to Convergence in Imperfect Information
                Games: Finding Equilibrium via Regularization},
  journal    = {CoRR},
  volume     = {abs/2002.08456},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.08456},
  eprinttype = {arXiv},
  eprint     = {2002.08456},
  timestamp  = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-08456.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2004.09468.
% A conference record with the same title is DBLP:conf/nips/CzarneckiGTTOBJ20.
@article{DBLP:journals/corr/abs-2004-09468,
  author     = {Czarnecki, Wojciech Marian and
                Gidel, Gauthier and
                Tracey, Brendan D. and
                Tuyls, Karl and
                Omidshafiei, Shayegan and
                Balduzzi, David and
                Jaderberg, Max},
  title      = {Real World Games Look Like Spinning Tops},
  journal    = {CoRR},
  volume     = {abs/2004.09468},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.09468},
  eprinttype = {arXiv},
  eprint     = {2004.09468},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-09468.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2005.01642.
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser.
@article{DBLP:journals/corr/abs-2005-01642,
  author     = {Omidshafiei, Shayegan and
                Tuyls, Karl and
                Czarnecki, Wojciech M. and
                Santos, Francisco C. and
                Rowland, Mark and
                Connor, Jerome T. and
                Hennes, Daniel and
                Muller, Paul and
                P{\'{e}}rolat, Julien and
                De Vylder, Bart and
                Gruslys, Audrunas and
                Munos, R{\'{e}}mi},
  title      = {Navigating the Landscape of Games},
  journal    = {CoRR},
  volume     = {abs/2005.01642},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.01642},
  eprinttype = {arXiv},
  eprint     = {2005.01642},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-01642.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) preprint 2011.09192.
% A journal record with the same authors and title is
% DBLP:journals/jair/TuylsOMWCHGSWSL21.
% Names use the "Last, First" form so the two-word surname "De Vylder" is not
% split by BibTeX's name parser.
@article{DBLP:journals/corr/abs-2011-09192,
  author     = {Tuyls, Karl and
                Omidshafiei, Shayegan and
                Muller, Paul and
                Wang, Zhe and
                Connor, Jerome T. and
                Hennes, Daniel and
                Graham, Ian and
                Spearman, William and
                Waskett, Tim and
                Steele, Dafydd and
                Luc, Pauline and
                Recasens, Adri{\`{a}} and
                Galashov, Alexandre and
                Thornton, Gregory and
                Elie, Romuald and
                Sprechmann, Pablo and
                Moreno, Pol and
                Cao, Kris and
                Garnelo, Marta and
                Dutta, Praneet and
                Valko, Michal and
                Heess, Nicolas and
                Bridgland, Alex and
                P{\'{e}}rolat, Julien and
                De Vylder, Bart and
                Eslami, S. M. Ali and
                Rowland, Mark and
                Jaegle, Andrew and
                Munos, R{\'{e}}mi and
                Back, Trevor and
                Ahamed, Razia and
                Bouton, Simon and
                Beauguerlange, Nathalie and
                Broshear, Jackson and
                Graepel, Thore and
                Hassabis, Demis},
  title      = {Game Plan: What {AI} can do for Football, and What Football can do
                for {AI}},
  journal    = {CoRR},
  volume     = {abs/2011.09192},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.09192},
  eprinttype = {arXiv},
  eprint     = {2011.09192},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-09192.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% AAAI 2019 conference paper. DBLP:journals/corr/abs-1805-07830 in this file
% has the same title and author list (arXiv version).
@inproceedings{DBLP:conf/aaai/OmidshafieiKLTR19,
  author       = {Shayegan Omidshafiei and Dong{-}Ki Kim and Miao Liu and
                  Gerald Tesauro and Matthew Riemer and Christopher Amato and
                  Murray Campbell and Jonathan P. How},
  title        = {Learning to Teach in Cooperative Multiagent Reinforcement Learning},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {6128--6136},
  year         = {2019},
  publisher    = {{AAAI} Press},
  doi          = {10.1609/AAAI.V33I01.33016128},
  url          = {https://doi.org/10.1609/aaai.v33i01.33016128},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/OmidshafieiKLTR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% IROS 2019 conference paper. DBLP:journals/corr/abs-1903-06592 in this file
% has the same title and author list (arXiv version).
@inproceedings{DBLP:conf/iros/WadhwaniaKOH19,
  author       = {Samir Wadhwania and Dong{-}Ki Kim and
                  Shayegan Omidshafiei and Jonathan P. How},
  title        = {Policy Distillation and Value Matching in Multiagent Reinforcement
                  Learning},
  booktitle    = {2019 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2019, Macau, SAR, China, November 3-8, 2019},
  pages        = {8193--8200},
  year         = {2019},
  publisher    = {{IEEE}},
  doi          = {10.1109/IROS40897.2019.8967849},
  url          = {https://doi.org/10.1109/IROS40897.2019.8967849},
  timestamp    = {Fri, 31 Jan 2020 10:27:14 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/WadhwaniaKOH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2019 conference paper. DBLP:journals/corr/abs-1909-09849 in this file
% has the same title and author list (arXiv version).
@inproceedings{DBLP:conf/nips/RowlandOTPVPM19,
  author       = {Mark Rowland and Shayegan Omidshafiei and Karl Tuyls and
                  Julien P{\'{e}}rolat and Michal Valko and
                  Georgios Piliouras and R{\'{e}}mi Munos},
  editor       = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and
                  Roman Garnett},
  title        = {Multiagent Evaluation under Incomplete Information},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, NeurIPS 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {12270--12282},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/510f2318f324cf07fce24c3a4b89c771-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/RowlandOTPVPM19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1903.01373 (recorded with journal CoRR).
@article{DBLP:journals/corr/abs-1903-01373,
  author       = {Shayegan Omidshafiei and
                  Christos H. Papadimitriou and
                  Georgios Piliouras and
                  Karl Tuyls and
                  Mark Rowland and
                  Jean{-}Baptiste Lespiau and
                  Wojciech M. Czarnecki and
                  Marc Lanctot and
                  Julien P{\'{e}}rolat and
                  R{\'{e}}mi Munos},
  title        = {{\(\alpha\)}-Rank: Multi-Agent Evaluation by Evolution},
  journal      = {CoRR},
  volume       = {abs/1903.01373},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.01373},
  eprinttype   = {arXiv},
  eprint       = {1903.01373},
  timestamp    = {Tue, 28 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-01373.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.03216 (recorded with journal CoRR).
@article{DBLP:journals/corr/abs-1903-03216,
  author       = {Dong{-}Ki Kim and
                  Miao Liu and
                  Shayegan Omidshafiei and
                  Sebastian Lopez{-}Cot and
                  Matthew Riemer and
                  Golnaz Habibi and
                  Gerald Tesauro and
                  Sami Mourad and
                  Murray Campbell and
                  Jonathan P. How},
  title        = {Learning Hierarchical Teaching in Cooperative Multiagent Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1903.03216},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.03216},
  eprinttype   = {arXiv},
  eprint       = {1903.03216},
  timestamp    = {Thu, 12 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-03216.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.06592 (recorded with journal CoRR).
% DBLP:conf/iros/WadhwaniaKOH19 in this file has the same title and author list.
@article{DBLP:journals/corr/abs-1903-06592,
  author       = {Samir Wadhwania and
                  Dong{-}Ki Kim and
                  Shayegan Omidshafiei and
                  Jonathan P. How},
  title        = {Policy Distillation and Value Matching in Multiagent Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1903.06592},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.06592},
  eprinttype   = {arXiv},
  eprint       = {1903.06592},
  timestamp    = {Mon, 01 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-06592.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.00190 (recorded with journal CoRR).
@article{DBLP:journals/corr/abs-1906-00190,
  author       = {Shayegan Omidshafiei and
                  Daniel Hennes and
                  Dustin Morrill and
                  R{\'{e}}mi Munos and
                  Julien P{\'{e}}rolat and
                  Marc Lanctot and
                  Audrunas Gruslys and
                  Jean{-}Baptiste Lespiau and
                  Karl Tuyls},
  title        = {Neural Replicator Dynamics},
  journal      = {CoRR},
  volume       = {abs/1906.00190},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.00190},
  eprinttype   = {arXiv},
  eprint       = {1906.00190},
  timestamp    = {Thu, 13 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-00190.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1908.09453 (recorded with journal CoRR).
% The camel-case name OpenSpiel is braced so that sentence-casing styles do
% not lowercase its inner capital.
@article{DBLP:journals/corr/abs-1908-09453,
  author       = {Marc Lanctot and
                  Edward Lockhart and
                  Jean{-}Baptiste Lespiau and
                  Vin{\'{\i}}cius Flores Zambaldi and
                  Satyaki Upadhyay and
                  Julien P{\'{e}}rolat and
                  Sriram Srinivasan and
                  Finbarr Timbers and
                  Karl Tuyls and
                  Shayegan Omidshafiei and
                  Daniel Hennes and
                  Dustin Morrill and
                  Paul Muller and
                  Timo Ewalds and
                  Ryan Faulkner and
                  J{\'{a}}nos Kram{\'{a}}r and
                  Bart De Vylder and
                  Brennan Saeta and
                  James Bradbury and
                  David Ding and
                  Sebastian Borgeaud and
                  Matthew Lai and
                  Julian Schrittwieser and
                  Thomas W. Anthony and
                  Edward Hughes and
                  Ivo Danihelka and
                  Jonah Ryan{-}Davis},
  title        = {{OpenSpiel}: {A} Framework for Reinforcement Learning in Games},
  journal      = {CoRR},
  volume       = {abs/1908.09453},
  year         = {2019},
  url          = {https://arxiv.org/abs/1908.09453},
  eprinttype   = {arXiv},
  eprint       = {1908.09453},
  timestamp    = {Tue, 18 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-09453.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1909.09849 (recorded with journal CoRR).
% DBLP:conf/nips/RowlandOTPVPM19 in this file has the same title and author list.
@article{DBLP:journals/corr/abs-1909-09849,
  author       = {Mark Rowland and
                  Shayegan Omidshafiei and
                  Karl Tuyls and
                  Julien P{\'{e}}rolat and
                  Michal Valko and
                  Georgios Piliouras and
                  R{\'{e}}mi Munos},
  title        = {Multiagent Evaluation under Incomplete Information},
  journal      = {CoRR},
  volume       = {abs/1909.09849},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.09849},
  eprinttype   = {arXiv},
  eprint       = {1909.09849},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-09849.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1909.12823 (recorded with journal CoRR).
@article{DBLP:journals/corr/abs-1909-12823,
  author       = {Paul Muller and
                  Shayegan Omidshafiei and
                  Mark Rowland and
                  Karl Tuyls and
                  Julien P{\'{e}}rolat and
                  Siqi Liu and
                  Daniel Hennes and
                  Luke Marris and
                  Marc Lanctot and
                  Edward Hughes and
                  Zhe Wang and
                  Guy Lever and
                  Nicolas Heess and
                  Thore Graepel and
                  R{\'{e}}mi Munos},
  title        = {A Generalized Training Approach for Multiagent Learning},
  journal      = {CoRR},
  volume       = {abs/1909.12823},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.12823},
  eprinttype   = {arXiv},
  eprint       = {1909.12823},
  timestamp    = {Thu, 11 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-12823.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS 2018 conference paper. DBLP:journals/corr/abs-1711-10314 in this file
% has the same title and author list (arXiv version).
% The publisher's city is kept in the address field, separate from the
% publisher names.
@inproceedings{DBLP:conf/atal/OmidshafieiKPH18,
  author       = {Shayegan Omidshafiei and
                  Dong{-}Ki Kim and
                  Jason Pazis and
                  Jonathan P. How},
  editor       = {Elisabeth Andr{\'{e}} and
                  Sven Koenig and
                  Mehdi Dastani and
                  Gita Sukthankar},
  title        = {Crossmodal Attentive Skill Learner},
  booktitle    = {Proceedings of the 17th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15,
                  2018},
  pages        = {139--146},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems
                  / {ACM}},
  address      = {Richland, SC, {USA}},
  year         = {2018},
  url          = {http://dl.acm.org/citation.cfm?id=3237410},
  timestamp    = {Sat, 30 Sep 2023 09:34:53 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/OmidshafieiKPH18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1805.07830 (recorded with journal CoRR).
% DBLP:conf/aaai/OmidshafieiKLTR19 in this file has the same title and author list.
@article{DBLP:journals/corr/abs-1805-07830,
  author       = {Shayegan Omidshafiei and
                  Dong{-}Ki Kim and
                  Miao Liu and
                  Gerald Tesauro and
                  Matthew Riemer and
                  Christopher Amato and
                  Murray Campbell and
                  Jonathan P. How},
  title        = {Learning to Teach in Cooperative Multiagent Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1805.07830},
  year         = {2018},
  url          = {https://arxiv.org/abs/1805.07830},
  eprinttype   = {arXiv},
  eprint       = {1805.07830},
  timestamp    = {Mon, 05 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-07830.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 36, number 2 (2017).
% Markov is braced so sentence-casing styles keep the proper noun capitalized.
% The journal name is stored in full; the author spelling
% Ali-akbar Agha-mohammadi matches the other entries for this author in this file.
@article{DBLP:journals/ijrr/OmidshafieiAALH17,
  author       = {Shayegan Omidshafiei and
                  Ali{-}akbar Agha{-}mohammadi and
                  Christopher Amato and
                  Shih{-}Yuan Liu and
                  Jonathan P. How and
                  John Vian},
  title        = {Decentralized control of multi-robot partially observable {Markov} decision
                  processes using belief space macro-actions},
  journal      = {The International Journal of Robotics Research},
  volume       = {36},
  number       = {2},
  pages        = {231--258},
  year         = {2017},
  url          = {https://doi.org/10.1177/0278364917692864},
  doi          = {10.1177/0278364917692864},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijrr/OmidshafieiAALH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 conference paper (PMLR volume 70).
% DBLP:journals/corr/OmidshafieiPAHV17 in this file has the same title and
% author list (arXiv version).
@inproceedings{DBLP:conf/icml/OmidshafieiPAHV17,
  author       = {Shayegan Omidshafiei and
                  Jason Pazis and
                  Christopher Amato and
                  Jonathan P. How and
                  John Vian},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Deep Decentralized Multi-task Multi-Agent Reinforcement Learning under
                  Partial Observability},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {2681--2690},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {https://proceedings.mlr.press/v70/omidshafiei17a.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/OmidshafieiPAHV17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2017 conference paper. DBLP:journals/corr/OmidshafieiALEH17 in this file
% has the same author list and the same title up to capitalization (arXiv version).
@inproceedings{DBLP:conf/icra/OmidshafieiALEH17,
  author       = {Shayegan Omidshafiei and Christopher Amato and Miao Liu and
                  Michael Everett and Jonathan P. How and John Vian},
  title        = {Scalable accelerated decentralized multi-robot policy search in continuous
                  observation spaces},
  booktitle    = {2017 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2017, Singapore, Singapore, May 29 - June 3, 2017},
  pages        = {863--870},
  year         = {2017},
  publisher    = {{IEEE}},
  doi          = {10.1109/ICRA.2017.7989106},
  url          = {https://doi.org/10.1109/ICRA.2017.7989106},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OmidshafieiALEH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICRA 2017 conference paper. DBLP:journals/corr/OmidshafieiLELA17 in this file
% has the same author list and the same title up to capitalization (arXiv version).
@inproceedings{DBLP:conf/icra/OmidshafieiLELA17,
  author       = {Shayegan Omidshafiei and Shih{-}Yuan Liu and Michael Everett and
                  Brett Thomas Lopez and Christopher Amato and Miao Liu and
                  Jonathan P. How and John Vian},
  title        = {Semantic-level decentralized multi-robot decision-making using probabilistic
                  macro-observations},
  booktitle    = {2017 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2017, Singapore, Singapore, May 29 - June 3, 2017},
  pages        = {871--878},
  year         = {2017},
  publisher    = {{IEEE}},
  doi          = {10.1109/ICRA.2017.7989107},
  url          = {https://doi.org/10.1109/ICRA.2017.7989107},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OmidshafieiLELA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% IROS 2017 conference paper. DBLP:journals/corr/LiuSOAH17 in this file has the
% same author list and the same title up to capitalization (arXiv version).
@inproceedings{DBLP:conf/iros/LiuSOAH17,
  author       = {Miao Liu and Kavinayan Sivakumar and Shayegan Omidshafiei and
                  Christopher Amato and Jonathan P. How},
  title        = {Learning for multi-robot cooperation in partially observable stochastic
                  environments with macro-actions},
  booktitle    = {2017 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2017, Vancouver, BC, Canada, September 24-28, 2017},
  pages        = {1853--1860},
  year         = {2017},
  publisher    = {{IEEE}},
  doi          = {10.1109/IROS.2017.8206001},
  url          = {https://doi.org/10.1109/IROS.2017.8206001},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/LiuSOAH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1703.05623 (recorded with journal CoRR).
% DBLP:conf/icra/OmidshafieiLELA17 in this file has the same author list and
% the same title up to capitalization.
@article{DBLP:journals/corr/OmidshafieiLELA17,
  author       = {Shayegan Omidshafiei and
                  Shih{-}Yuan Liu and
                  Michael Everett and
                  Brett Thomas Lopez and
                  Christopher Amato and
                  Miao Liu and
                  Jonathan P. How and
                  John Vian},
  title        = {Semantic-level Decentralized Multi-Robot Decision-Making using Probabilistic
                  Macro-Observations},
  journal      = {CoRR},
  volume       = {abs/1703.05623},
  year         = {2017},
  url          = {https://arxiv.org/abs/1703.05623},
  eprinttype   = {arXiv},
  eprint       = {1703.05623},
  timestamp    = {Tue, 06 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OmidshafieiLELA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1703.05626 (recorded with journal CoRR).
% DBLP:conf/icra/OmidshafieiALEH17 in this file has the same author list and
% the same title up to capitalization.
@article{DBLP:journals/corr/OmidshafieiALEH17,
  author       = {Shayegan Omidshafiei and
                  Christopher Amato and
                  Miao Liu and
                  Michael Everett and
                  Jonathan P. How and
                  John Vian},
  title        = {Scalable Accelerated Decentralized Multi-Robot Policy Search in Continuous
                  Observation Spaces},
  journal      = {CoRR},
  volume       = {abs/1703.05626},
  year         = {2017},
  url          = {https://arxiv.org/abs/1703.05626},
  eprinttype   = {arXiv},
  eprint       = {1703.05626},
  timestamp    = {Mon, 05 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OmidshafieiALEH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1703.06182 (recorded with journal CoRR).
% DBLP:conf/icml/OmidshafieiPAHV17 in this file has the same title and author list.
@article{DBLP:journals/corr/OmidshafieiPAHV17,
  author       = {Shayegan Omidshafiei and
                  Jason Pazis and
                  Christopher Amato and
                  Jonathan P. How and
                  John Vian},
  title        = {Deep Decentralized Multi-task Multi-Agent Reinforcement Learning under
                  Partial Observability},
  journal      = {CoRR},
  volume       = {abs/1703.06182},
  year         = {2017},
  url          = {https://arxiv.org/abs/1703.06182},
  eprinttype   = {arXiv},
  eprint       = {1703.06182},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OmidshafieiPAHV17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1707.07399 (recorded with journal CoRR).
% DBLP:conf/iros/LiuSOAH17 in this file has the same author list and the same
% title up to capitalization.
@article{DBLP:journals/corr/LiuSOAH17,
  author       = {Miao Liu and
                  Kavinayan Sivakumar and
                  Shayegan Omidshafiei and
                  Christopher Amato and
                  Jonathan P. How},
  title        = {Learning for Multi-robot Cooperation in Partially Observable Stochastic
                  Environments with Macro-actions},
  journal      = {CoRR},
  volume       = {abs/1707.07399},
  year         = {2017},
  url          = {https://arxiv.org/abs/1707.07399},
  eprinttype   = {arXiv},
  eprint       = {1707.07399},
  timestamp    = {Mon, 05 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiuSOAH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.10314 (recorded with journal CoRR).
% DBLP:conf/atal/OmidshafieiKPH18 in this file has the same title and author list.
@article{DBLP:journals/corr/abs-1711-10314,
  author       = {Shayegan Omidshafiei and
                  Dong{-}Ki Kim and
                  Jason Pazis and
                  Jonathan P. How},
  title        = {Crossmodal Attentive Skill Learner},
  journal      = {CoRR},
  volume       = {abs/1711.10314},
  year         = {2017},
  url          = {https://arxiv.org/abs/1711.10314},
  eprinttype   = {arXiv},
  eprint       = {1711.10314},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-10314.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 74 (2016).
% Dirichlet and Gaussian are braced so sentence-casing styles keep the proper
% nouns capitalized; the journal name is stored in full rather than abbreviated.
@article{DBLP:journals/automatica/WeiLZFLKOH16,
  author       = {Hongchuan Wei and
                  Wenjie Lu and
                  Pingping Zhu and
                  Silvia Ferrari and
                  Miao Liu and
                  Robert H. Klein and
                  Shayegan Omidshafiei and
                  Jonathan P. How},
  title        = {Information value in nonparametric {Dirichlet}-process {Gaussian}-process
                  {(DPGP)} mixture models},
  journal      = {Automatica},
  volume       = {74},
  pages        = {360--368},
  year         = {2016},
  url          = {https://doi.org/10.1016/j.automatica.2016.07.018},
  doi          = {10.1016/J.AUTOMATICA.2016.07.018},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/automatica/WeiLZFLKOH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2016 conference paper.
% The acronym POMDPs is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icra/OmidshafieiAALH16,
  author       = {Shayegan Omidshafiei and
                  Ali{-}akbar Agha{-}mohammadi and
                  Christopher Amato and
                  Shih{-}Yuan Liu and
                  Jonathan P. How and
                  John Vian},
  editor       = {Danica Kragic and
                  Antonio Bicchi and
                  Alessandro De Luca},
  title        = {Graph-based Cross Entropy method for solving multi-robot decentralized
                  {POMDPs}},
  booktitle    = {2016 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2016, Stockholm, Sweden, May 16-21, 2016},
  pages        = {5395--5402},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICRA.2016.7487751},
  doi          = {10.1109/ICRA.2016.7487751},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OmidshafieiAALH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1605.01042 (recorded with journal CoRR).
% Bayesian is braced so sentence-casing styles keep it capitalized.
@article{DBLP:journals/corr/OmidshafieiLHV16,
  author       = {Shayegan Omidshafiei and
                  Brett Thomas Lopez and
                  Jonathan P. How and
                  John Vian},
  title        = {Hierarchical {Bayesian} Noise Inference for Robust Real-time Probabilistic
                  Object Classification},
  journal      = {CoRR},
  volume       = {abs/1605.01042},
  year         = {2016},
  url          = {https://arxiv.org/abs/1605.01042},
  eprinttype   = {arXiv},
  eprint       = {1605.01042},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OmidshafieiLHV16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% 2015 AAAI Fall Symposia paper, pages 10--12.
@inproceedings{DBLP:conf/aaaifs/AmatoKOAHK15,
  author       = {Christopher Amato and George Dimitri Konidaris and
                  Shayegan Omidshafiei and Ali{-}akbar Agha{-}mohammadi and
                  Jonathan P. How and Leslie Pack Kaelbling},
  title        = {Probabilistic Planning for Decentralized Multi-Robot Systems},
  booktitle    = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14,
                  2015},
  pages        = {10--12},
  year         = {2015},
  publisher    = {{AAAI} Press},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11655},
  timestamp    = {Tue, 19 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/AmatoKOAHK15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICRA 2015 conference paper. DBLP:journals/corr/OmidshafieiAAH15 in this file
% has the same author list and the same title up to capitalization (arXiv version).
% Markov is braced so sentence-casing styles keep the proper noun capitalized.
@inproceedings{DBLP:conf/icra/OmidshafieiAAH15,
  author       = {Shayegan Omidshafiei and
                  Ali{-}akbar Agha{-}mohammadi and
                  Christopher Amato and
                  Jonathan P. How},
  title        = {Decentralized control of Partially Observable {Markov} Decision Processes
                  using belief space macro-actions},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2015, Seattle, WA, USA, 26-30 May, 2015},
  pages        = {5962--5969},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICRA.2015.7140035},
  doi          = {10.1109/ICRA.2015.7140035},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OmidshafieiAAH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2015 conference paper, pages 5181--5188.
@inproceedings{DBLP:conf/iros/UreOLAHV15,
  author       = {N. Kemal Ure and Shayegan Omidshafiei and Brett Thomas Lopez and
                  Ali{-}akbar Agha{-}mohammadi and Jonathan P. How and
                  John Vian},
  title        = {Online heterogeneous multiagent learning under limited communication
                  with applications to forest fire management},
  booktitle    = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2015, Hamburg, Germany, September 28 - October 2,
                  2015},
  pages        = {5181--5188},
  year         = {2015},
  publisher    = {{IEEE}},
  doi          = {10.1109/IROS.2015.7354107},
  url          = {https://doi.org/10.1109/IROS.2015.7354107},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/UreOLAHV15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1502.06030 (recorded with journal CoRR).
% DBLP:conf/icra/OmidshafieiAAH15 in this file has the same author list and
% the same title up to capitalization.
% Markov is braced so sentence-casing styles keep the proper noun capitalized.
@article{DBLP:journals/corr/OmidshafieiAAH15,
  author       = {Shayegan Omidshafiei and
                  Ali{-}akbar Agha{-}mohammadi and
                  Christopher Amato and
                  Jonathan P. How},
  title        = {Decentralized Control of Partially Observable {Markov} Decision Processes
                  using Belief Space Macro-actions},
  journal      = {CoRR},
  volume       = {abs/1502.06030},
  year         = {2015},
  url          = {https://arxiv.org/abs/1502.06030},
  eprinttype   = {arXiv},
  eprint       = {1502.06030},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OmidshafieiAAH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2014 conference paper, pages 95--102.
% Bayesian, Dirichlet and Gaussian are braced so sentence-casing styles keep
% them capitalized.
@inproceedings{DBLP:conf/iros/WeiLZFKOH14,
  author       = {Hongchuan Wei and
                  Wenjie Lu and
                  Pingping Zhu and
                  Silvia Ferrari and
                  Robert H. Klein and
                  Shayegan Omidshafiei and
                  Jonathan P. How},
  title        = {Camera control for learning nonlinear target dynamics via {Bayesian}
                  nonparametric {Dirichlet}-process {Gaussian}-process {(DP-GP)} models},
  booktitle    = {2014 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2014, Chicago, IL, USA, September 14-18, 2014},
  pages        = {95--102},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/IROS.2014.6942546},
  doi          = {10.1109/IROS.2014.6942546},
  timestamp    = {Tue, 05 Sep 2023 15:07:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/WeiLZFKOH14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}