@comment{BibTeX records for Stefano V. Albrecht (dblp export; originally offered as a downloadable .bib file).}

@comment{AAAI 2024 conference paper. The EAAI year in the booktitle is 2024, matching the event dates (February 20-27, 2024). An arXiv record with the same authors and (up to capitalisation) the same title is DBLP:journals/corr/abs-2307-05209.}
@inproceedings{DBLP:conf/aaai/AzranDAK24,
  author    = {Guy Azran and Mohamad H. Danesh and Stefano V. Albrecht and Sarah Keren},
  title     = {Contextual Pre-planning on Reward Machine Abstractions for Enhanced Transfer in Deep Reinforcement Learning},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {10953--10961},
  publisher = {{AAAI} Press},
  year      = {2024},
  doi       = {10.1609/AAAI.V38I10.28970},
  url       = {https://doi.org/10.1609/aaai.v38i10.28970},
  timestamp = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AzranDAK24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{AAMAS 2024 conference paper (pages 598--606).}
@inproceedings{DBLP:conf/atal/FosongRCA24,
  author    = {Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
  title     = {Learning Complex Teamwork Tasks using a Given Sub-task Decomposition},
  editor    = {Mehdi Dastani and Jaime Sim{\~{a}}o Sichman and Natasha Alechina and Virginia Dignum},
  booktitle = {Proceedings of the 23rd International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2024, Auckland, New Zealand, May 6-10, 2024},
  pages     = {598--606},
  publisher = {{ACM}},
  year      = {2024},
  doi       = {10.5555/3635637.3662911},
  url       = {https://dl.acm.org/doi/10.5555/3635637.3662911},
  timestamp = {Fri, 03 May 2024 14:27:55 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/FosongRCA24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{AAMAS 2024 conference paper (pages 771--779).}
@inproceedings{DBLP:conf/atal/GyevnarWLCA24,
  author    = {Balint Gyevnar and Cheng Wang and Christopher G. Lucas and Shay B. Cohen and Stefano V. Albrecht},
  title     = {Causal Explanations for Sequential Decision-Making in Multi-Agent Systems},
  editor    = {Mehdi Dastani and Jaime Sim{\~{a}}o Sichman and Natasha Alechina and Virginia Dignum},
  booktitle = {Proceedings of the 23rd International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2024, Auckland, New Zealand, May 6-10, 2024},
  pages     = {771--779},
  publisher = {{ACM}},
  year      = {2024},
  doi       = {10.5555/3635637.3662930},
  url       = {https://dl.acm.org/doi/10.5555/3635637.3662930},
  timestamp = {Fri, 03 May 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/GyevnarWLCA24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2401.08808, filed under CoRR (2024).}
@article{DBLP:journals/corr/abs-2401-08808,
  author     = {Shangmin Guo and Yi Ren and Stefano V. Albrecht and Kenny Smith},
  title      = {Sample Relationship from Learning Dynamics Matters for Generalisation},
  journal    = {CoRR},
  volume     = {abs/2401.08808},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2401.08808},
  doi        = {10.48550/ARXIV.2401.08808},
  url        = {https://doi.org/10.48550/arXiv.2401.08808},
  timestamp  = {Thu, 01 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-08808.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2402.03479, filed under CoRR (2024).}
@article{DBLP:journals/corr/abs-2402-03479,
  author     = {Samuel Garcin and James Doran and Shangmin Guo and Christopher G. Lucas and Stefano V. Albrecht},
  title      = {{ICED:} Zero-Shot Transfer in Reinforcement Learning via In-Context Environment Design},
  journal    = {CoRR},
  volume     = {abs/2402.03479},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2402.03479},
  doi        = {10.48550/ARXIV.2402.03479},
  url        = {https://doi.org/10.48550/arXiv.2402.03479},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-03479.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2402.10086, filed under CoRR (2024).}
@article{DBLP:journals/corr/abs-2402-10086,
  author     = {Anton Kuznietsov and Balint Gyevnar and Cheng Wang and Steven Peters and Stefano V. Albrecht},
  title      = {Explainable {AI} for Safe and Trustworthy Autonomous Driving: {A} Systematic Review},
  journal    = {CoRR},
  volume     = {abs/2402.10086},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2402.10086},
  doi        = {10.48550/ARXIV.2402.10086},
  url        = {https://doi.org/10.48550/arXiv.2402.10086},
  timestamp  = {Tue, 20 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-10086.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{Journal article, volume 8, number 8 (2023). The mixed-case name DiPA is braced in the title so that styles which lowercase titles keep its capitalisation.}
@article{DBLP:journals/ral/KnittelHARR23,
  author    = {Anthony Knittel and Majd Hawasly and Stefano V. Albrecht and John Redford and Subramanian Ramamoorthy},
  title     = {{DiPA}: Probabilistic Multi-Modal Interactive Prediction for Autonomous Driving},
  journal   = {{IEEE} Robotics Autom. Lett.},
  volume    = {8},
  number    = {8},
  pages     = {4887--4894},
  year      = {2023},
  doi       = {10.1109/LRA.2023.3284355},
  url       = {https://doi.org/10.1109/LRA.2023.3284355},
  timestamp = {Sat, 05 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ral/KnittelHARR23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{ICLR 2023 conference paper (no page numbers; URL points to OpenReview). An arXiv record with the same title is DBLP:journals/corr/abs-2207-05480.}
@inproceedings{DBLP:conf/iclr/DunionMLHA23,
  author    = {Mhairi Dunion and Trevor McInroe and Kevin Sebastian Luck and Josiah P. Hanna and Stefano V. Albrecht},
  title     = {Temporal Disentanglement of Representations for Improved Generalisation in Reinforcement Learning},
  booktitle = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher = {OpenReview.net},
  year      = {2023},
  url       = {https://openreview.net/pdf?id=sPgP6aISLTD},
  timestamp = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/DunionMLHA23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{ICRA 2023 conference paper (pages 5558--5565).}
@inproceedings{DBLP:conf/icra/ChristianosKIAP23,
  author    = {Filippos Christianos and P{\'{e}}ter Karkus and Boris Ivanovic and Stefano V. Albrecht and Marco Pavone},
  title     = {Planning with Occluded Traffic Agents using Bi-Level Variational Occlusion Models},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages     = {5558--5565},
  publisher = {{IEEE}},
  year      = {2023},
  doi       = {10.1109/ICRA48891.2023.10160604},
  url       = {https://doi.org/10.1109/ICRA48891.2023.10160604},
  timestamp = {Tue, 07 May 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/ChristianosKIAP23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{IROS 2023 conference paper. The booktitle is spelled out in the same form as the IROS 2022 record in this file, and the publisher is given. NOTE(review): venue and dates (Detroit, October 1-5, 2023) come from the conference's public listing -- confirm. An arXiv record with the same title is DBLP:journals/corr/abs-2206-14163.}
@inproceedings{DBLP:conf/iros/BrewittT0A23,
  author    = {Cillian Brewitt and Massimiliano Tamborski and Cheng Wang and Stefano V. Albrecht},
  title     = {Verifiable Goal Recognition for Autonomous Driving with Occlusions},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages     = {11210--11217},
  publisher = {{IEEE}},
  year      = {2023},
  doi       = {10.1109/IROS55552.2023.10342386},
  url       = {https://doi.org/10.1109/IROS55552.2023.10342386},
  timestamp = {Fri, 05 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/BrewittT0A23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{NeurIPS 2023 conference paper (no page numbers in this record). The author name Josiah P. Hanna uses the same spelling as the other records of this author in the file. An arXiv record with the same title is DBLP:journals/corr/abs-2305-14133.}
@inproceedings{DBLP:conf/nips/DunionMLHA23,
  author    = {Mhairi Dunion and Trevor McInroe and Kevin Sebastian Luck and Josiah P. Hanna and Stefano V. Albrecht},
  title     = {Conditional Mutual Information for Disentangled Representations in Reinforcement Learning},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/fd750154df5f199f94df897975621306-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/DunionMLHA23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2302.03439, filed under CoRR (2023).}
@article{DBLP:journals/corr/abs-2302-03439,
  author     = {Lukas Sch{\"{a}}fer and Oliver Slumbers and Stephen McAleer and Yali Du and Stefano V. Albrecht and David Mguni},
  title      = {Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2302.03439},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2302.03439},
  doi        = {10.48550/ARXIV.2302.03439},
  url        = {https://doi.org/10.48550/arXiv.2302.03439},
  timestamp  = {Fri, 12 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-03439.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2302.04944, filed under CoRR (2023).}
@article{DBLP:journals/corr/abs-2302-04944,
  author     = {Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
  title      = {Learning Complex Teamwork Tasks using a Sub-task Curriculum},
  journal    = {CoRR},
  volume     = {abs/2302.04944},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2302.04944},
  doi        = {10.48550/ARXIV.2302.04944},
  url        = {https://doi.org/10.48550/arXiv.2302.04944},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-04944.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2302.10809, filed under CoRR (2023).}
@article{DBLP:journals/corr/abs-2302-10809,
  author     = {Balint Gyevnar and Cheng Wang and Christopher G. Lucas and Shay B. Cohen and Stefano V. Albrecht},
  title      = {Causal Social Explanations for Stochastic Sequential Multi-Agent Decision-Making},
  journal    = {CoRR},
  volume     = {abs/2302.10809},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2302.10809},
  doi        = {10.48550/ARXIV.2302.10809},
  url        = {https://doi.org/10.48550/arXiv.2302.10809},
  timestamp  = {Mon, 22 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-10809.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2302.11793, filed under CoRR (2023). The proper noun Gumbel is braced in the title, like the acronym MADDPG, so that styles which lowercase titles keep its capital.}
@article{DBLP:journals/corr/abs-2302-11793,
  author     = {Callum Rhys Tilbury and Filippos Christianos and Stefano V. Albrecht},
  title      = {Revisiting the {Gumbel}-Softmax in {MADDPG}},
  journal    = {CoRR},
  volume     = {abs/2302.11793},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2302.11793},
  doi        = {10.48550/ARXIV.2302.11793},
  url        = {https://doi.org/10.48550/arXiv.2302.11793},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-11793.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2304.09825, filed under CoRR (2023). The last author is written in "Last, First" form so that BibTeX takes the two-word "Del Ser" as the surname; in "First Last" form only "Ser" would be parsed as the last name.}
@article{DBLP:journals/corr/abs-2304-09825,
  author     = {Alain Andres and Lukas Sch{\"{a}}fer and Esther Villar{-}Rodriguez and Stefano V. Albrecht and Del Ser, Javier},
  title      = {Using Offline Data to Speed-up Reinforcement Learning in Procedurally Generated Environments},
  journal    = {CoRR},
  volume     = {abs/2304.09825},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2304.09825},
  doi        = {10.48550/ARXIV.2304.09825},
  url        = {https://doi.org/10.48550/arXiv.2304.09825},
  timestamp  = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-09825.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2305.05566, filed under CoRR (2023). The mixed-case name SMAClite is braced in the title so that styles which lowercase titles keep its capitalisation.}
@article{DBLP:journals/corr/abs-2305-05566,
  author     = {Adam Michalski and Filippos Christianos and Stefano V. Albrecht},
  title      = {{SMAClite}: {A} Lightweight Environment for Multi-Agent Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2305.05566},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2305.05566},
  doi        = {10.48550/ARXIV.2305.05566},
  url        = {https://doi.org/10.48550/arXiv.2305.05566},
  timestamp  = {Mon, 15 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-05566.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2305.14133, filed under CoRR (2023). A conference record with the same title is DBLP:conf/nips/DunionMLHA23.}
@article{DBLP:journals/corr/abs-2305-14133,
  author     = {Mhairi Dunion and Trevor McInroe and Kevin Sebastian Luck and Josiah P. Hanna and Stefano V. Albrecht},
  title      = {Conditional Mutual Information for Disentangled Representations in Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2305.14133},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2305.14133},
  doi        = {10.48550/ARXIV.2305.14133},
  url        = {https://doi.org/10.48550/arXiv.2305.14133},
  timestamp  = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-14133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2307.05209, filed under CoRR (2023). A conference record with the same authors and (up to capitalisation) the same title is DBLP:conf/aaai/AzranDAK24.}
@article{DBLP:journals/corr/abs-2307-05209,
  author     = {Guy Azran and Mohamad H. Danesh and Stefano V. Albrecht and Sarah Keren},
  title      = {Contextual Pre-Planning on Reward Machine Abstractions for Enhanced Transfer in Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2307.05209},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2307.05209},
  doi        = {10.48550/ARXIV.2307.05209},
  url        = {https://doi.org/10.48550/arXiv.2307.05209},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-05209.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2310.03494, filed under CoRR (2023). The title is recorded in sentence case.}
@article{DBLP:journals/corr/abs-2310-03494,
  author     = {Samuel Garcin and James Doran and Shangmin Guo and Christopher G. Lucas and Stefano V. Albrecht},
  title      = {How the level sampling process impacts zero-shot generalisation in deep reinforcement learning},
  journal    = {CoRR},
  volume     = {abs/2310.03494},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2310.03494},
  doi        = {10.48550/ARXIV.2310.03494},
  url        = {https://doi.org/10.48550/arXiv.2310.03494},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-03494.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2310.05723, filed under CoRR (2023).}
@article{DBLP:journals/corr/abs-2310-05723,
  author     = {Trevor McInroe and Stefano V. Albrecht and Amos J. Storkey},
  title      = {Planning to Go Out-of-Distribution in Offline-to-Online Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2310.05723},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2310.05723},
  doi        = {10.48550/ARXIV.2310.05723},
  url        = {https://doi.org/10.48550/arXiv.2310.05723},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-05723.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2312.04736, filed under CoRR (2023).}
@article{DBLP:journals/corr/abs-2312-04736,
  author     = {Sabrina McCallum and Max Taylor{-}Davies and Stefano V. Albrecht and Alessandro Suglia},
  title      = {Is Feedback All You Need? Leveraging Natural Language Feedback in Goal-Conditioned Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2312.04736},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2312.04736},
  doi        = {10.48550/ARXIV.2312.04736},
  url        = {https://doi.org/10.48550/arXiv.2312.04736},
  timestamp  = {Wed, 03 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-04736.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{Journal article, volume 35, number 4 (2022). The proper noun "United Kingdom" is braced in the title so that styles which lowercase titles keep its capitals.}
@article{DBLP:journals/aicom/AlbrechtW22,
  author    = {Stefano V. Albrecht and Michael J. Wooldridge},
  title     = {Multi-agent systems research in the {United Kingdom}},
  journal   = {{AI} Commun.},
  volume    = {35},
  number    = {4},
  pages     = {269--270},
  year      = {2022},
  doi       = {10.3233/AIC-229003},
  url       = {https://doi.org/10.3233/AIC-229003},
  timestamp = {Thu, 29 Sep 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aicom/AlbrechtW22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{Journal article, volume 35, number 4 (2022), pages 285--294.}
@article{DBLP:journals/aicom/HawaslySAARR22,
  author    = {Majd Hawasly and Jonathan Sadeghi and Morris Antonello and Stefano V. Albrecht and John Redford and Subramanian Ramamoorthy},
  title     = {Perspectives on the system-level design of a safe autonomous driving stack},
  journal   = {{AI} Commun.},
  volume    = {35},
  number    = {4},
  pages     = {285--294},
  year      = {2022},
  doi       = {10.3233/AIC-220148},
  url       = {https://doi.org/10.3233/AIC-220148},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aicom/HawaslySAARR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{Journal article, volume 35, number 4 (2022), pages 357--368; seventeen authors.}
@article{DBLP:journals/aicom/AhmedBCCDFGGGMP22,
  author    = {Ibrahim H. Ahmed and Cillian Brewitt and Ignacio Carlucho and Filippos Christianos and Mhairi Dunion and Elliot Fosong and Samuel Garcin and Shangmin Guo and Balint Gyevnar and Trevor McInroe and Georgios Papoudakis and Arrasy Rahman and Lukas Sch{\"{a}}fer and Massimiliano Tamborski and Giuseppe Vecchio and Cheng Wang and Stefano V. Albrecht},
  title     = {Deep reinforcement learning for multi-agent interaction},
  journal   = {{AI} Commun.},
  volume    = {35},
  number    = {4},
  pages     = {357--368},
  year      = {2022},
  doi       = {10.3233/AIC-220116},
  url       = {https://doi.org/10.3233/AIC-220116},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aicom/AhmedBCCDFGGGMP22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{Journal article, volume 38, number 2 (2022), pages 822--834.}
@article{DBLP:journals/trob/EirasHAR22,
  author    = {Francisco Eiras and Majd Hawasly and Stefano V. Albrecht and Subramanian Ramamoorthy},
  title     = {A Two-Stage Optimization-Based Motion Planner for Safe Urban Driving},
  journal   = {{IEEE} Trans. Robotics},
  volume    = {38},
  number    = {2},
  pages     = {822--834},
  year      = {2022},
  doi       = {10.1109/TRO.2021.3088009},
  url       = {https://doi.org/10.1109/TRO.2021.3088009},
  timestamp = {Wed, 27 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/trob/EirasHAR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{AAMAS 2022 conference paper (pages 1146--1154); the URL points to the IFAAMAS proceedings PDF.}
@inproceedings{DBLP:conf/atal/0001CHA22,
  author    = {Lukas Sch{\"{a}}fer and Filippos Christianos and Josiah P. Hanna and Stefano V. Albrecht},
  title     = {Decoupled Reinforcement Learning to Stabilise Intrinsically-Motivated Exploration},
  editor    = {Piotr Faliszewski and Viviana Mascardi and Catherine Pelachaud and Matthew E. Taylor},
  booktitle = {21st International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2022, Auckland, New Zealand, May 9-13, 2022},
  pages     = {1146--1154},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems {(IFAAMAS)}},
  year      = {2022},
  doi       = {10.5555/3535850.3535978},
  url       = {https://www.ifaamas.org/Proceedings/aamas2022/pdfs/p1146.pdf},
  timestamp = {Mon, 18 Jul 2022 17:13:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/0001CHA22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{EUMAS 2022 conference paper in Lecture Notes in Computer Science, volume 13442 (pages 275--293). The underscore in the url and doi values is kept escaped as in the dblp export.}
@inproceedings{DBLP:conf/eumas/MirskyCRFMSSA22,
  author    = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and Elliot Fosong and William Macke and Mohan Sridharan and Peter Stone and Stefano V. Albrecht},
  title     = {A Survey of Ad Hoc Teamwork Research},
  editor    = {Dorothea Baumeister and J{\"{o}}rg Rothe},
  booktitle = {Multi-Agent Systems - 19th European Conference, {EUMAS} 2022, D{\"{u}}sseldorf, Germany, September 14-16, 2022, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {13442},
  pages     = {275--293},
  publisher = {Springer},
  year      = {2022},
  doi       = {10.1007/978-3-031-20614-6\_16},
  url       = {https://doi.org/10.1007/978-3-031-20614-6\_16},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/eumas/MirskyCRFMSSA22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{ICLR 2022 conference paper (no page numbers; URL points to OpenReview, with the underscore escaped as in the dblp export).}
@inproceedings{DBLP:conf/iclr/GuoRMKAS22,
  author    = {Shangmin Guo and Yi Ren and Kory Wallace Mathewson and Simon Kirby and Stefano V. Albrecht and Kenny Smith},
  title     = {Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability},
  booktitle = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=WxuE\_JWxjkW},
  timestamp = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/GuoRMKAS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{IROS 2022 conference paper (pages 9829--9836). "Bayesian" is braced in the title so that styles which lowercase titles keep its capital. An arXiv record with the same authors and title is DBLP:journals/corr/abs-2203-08251.}
@inproceedings{DBLP:conf/iros/AntonelloDARR22,
  author    = {Morris Antonello and Mihai Dobre and Stefano V. Albrecht and John Redford and Subramanian Ramamoorthy},
  title     = {Flash: Fast and Light Motion Prediction for Autonomous Driving with {Bayesian} Inverse Planning and Learned Motion Profiles},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2022, Kyoto, Japan, October 23-27, 2022},
  pages     = {9829--9836},
  publisher = {{IEEE}},
  year      = {2022},
  doi       = {10.1109/IROS47612.2022.9981347},
  url       = {https://doi.org/10.1109/IROS47612.2022.9981347},
  timestamp = {Tue, 03 Jan 2023 14:18:21 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/AntonelloDARR22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{NeurIPS 2022 conference paper (no page numbers in this record). Editors are listed with full given names rather than initials, and the author name Josiah P. Hanna uses the same spelling as the other records of this author in the file. NOTE(review): the expansions Shakir Mohamed, Alekh Agarwal and Kyunghyun Cho come from the published NeurIPS 2022 proceedings -- confirm.}
@inproceedings{DBLP:conf/nips/ZhongZ0AH22,
  author    = {Rujie Zhong and Duohan Zhang and Lukas Sch{\"{a}}fer and Stefano V. Albrecht and Josiah P. Hanna},
  title     = {Robust On-Policy Sampling for Data-Efficient Policy Evaluation in Reinforcement Learning},
  editor    = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  booktitle = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year      = {2022},
  url       = {http://papers.nips.cc/paper\_files/paper/2022/hash/f2dbede0879b9d04ceb30f1b8b476b27-Abstract-Conference.html},
  timestamp = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/ZhongZ0AH22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2202.10450, filed under CoRR (2022). A doi field in the same 10.48550/ARXIV.<id> form as the other arXiv records in this file is included; the original arxiv.org URL is kept. NOTE(review): confirm the DOI resolves.}
@article{DBLP:journals/corr/abs-2202-10450,
  author     = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and Elliot Fosong and William Macke and Mohan Sridharan and Peter Stone and Stefano V. Albrecht},
  title      = {A Survey of Ad Hoc Teamwork: Definitions, Methods, and Open Problems},
  journal    = {CoRR},
  volume     = {abs/2202.10450},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2202.10450},
  doi        = {10.48550/ARXIV.2202.10450},
  url        = {https://arxiv.org/abs/2202.10450},
  timestamp  = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-10450.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2203.08251, filed under CoRR (2022). "Bayesian" is braced in the title so that styles which lowercase titles keep its capital. A conference record with the same authors and title is DBLP:conf/iros/AntonelloDARR22.}
@article{DBLP:journals/corr/abs-2203-08251,
  author     = {Morris Antonello and Mihai Dobre and Stefano V. Albrecht and John Redford and Subramanian Ramamoorthy},
  title      = {Flash: Fast and Light Motion Prediction for Autonomous Driving with {Bayesian} Inverse Planning and Learned Motion Profiles},
  journal    = {CoRR},
  volume     = {abs/2203.08251},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2203.08251},
  doi        = {10.48550/ARXIV.2203.08251},
  url        = {https://doi.org/10.48550/arXiv.2203.08251},
  timestamp  = {Mon, 28 Mar 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-08251.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2205.08389, filed under CoRR (2022).}
@article{DBLP:journals/corr/abs-2205-08389,
  author     = {Giuseppe Vecchio and Simone Palazzo and Dario C. Guastella and Ignacio Carlucho and Stefano V. Albrecht and Giovanni Muscato and Concetto Spampinato},
  title      = {{MIDGARD:} {A} Simulation Platform for Autonomous Navigation in Unstructured Environments},
  journal    = {CoRR},
  volume     = {abs/2205.08389},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2205.08389},
  doi        = {10.48550/ARXIV.2205.08389},
  url        = {https://doi.org/10.48550/arXiv.2205.08389},
  timestamp  = {Tue, 07 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-08389.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2206.08783, filed under CoRR (2022).}
@article{DBLP:journals/corr/abs-2206-08783,
  author     = {Balint Gyevnar and Massimiliano Tamborski and Cheng Wang and Christopher G. Lucas and Shay B. Cohen and Stefano V. Albrecht},
  title      = {A Human-Centric Method for Generating Causal Explanations in Natural Language for Autonomous Vehicle Motion Planning},
  journal    = {CoRR},
  volume     = {abs/2206.08783},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2206.08783},
  doi        = {10.48550/ARXIV.2206.08783},
  url        = {https://doi.org/10.48550/arXiv.2206.08783},
  timestamp  = {Mon, 22 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-08783.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2206.11396, filed under CoRR (2022).}
@article{DBLP:journals/corr/abs-2206-11396,
  author     = {Trevor McInroe and Lukas Sch{\"{a}}fer and Stefano V. Albrecht},
  title      = {Learning Representations for Control with Hierarchical Forward Models},
  journal    = {CoRR},
  volume     = {abs/2206.11396},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2206.11396},
  doi        = {10.48550/ARXIV.2206.11396},
  url        = {https://doi.org/10.48550/arXiv.2206.11396},
  timestamp  = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-11396.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@comment{arXiv preprint 2206.14163, filed under CoRR (2022). A conference record with the same title is DBLP:conf/iros/BrewittT0A23 (its author list has one additional name).}
@article{DBLP:journals/corr/abs-2206-14163,
  author     = {Cillian Brewitt and Massimiliano Tamborski and Stefano V. Albrecht},
  title      = {Verifiable Goal Recognition for Autonomous Driving with Occlusions},
  journal    = {CoRR},
  volume     = {abs/2206.14163},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2206.14163},
  doi        = {10.48550/ARXIV.2206.14163},
  url        = {https://doi.org/10.48550/arXiv.2206.14163},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-14163.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-02249,
  author       = {Lukas Sch{\"{a}}fer and
                  Filippos Christianos and
                  Amos J. Storkey and
                  Stefano V. Albrecht},
  title        = {Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2207.02249},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.02249},
  doi          = {10.48550/ARXIV.2207.02249},
  eprinttype    = {arXiv},
  eprint       = {2207.02249},
  timestamp    = {Wed, 10 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-02249.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-05480,
  author       = {Mhairi Dunion and
                  Trevor McInroe and
                  Kevin Sebastian Luck and
                  Josiah P. Hanna and
                  Stefano V. Albrecht},
  title        = {Temporal Disentanglement of Representations for Improved Generalisation
                  in Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2207.05480},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.05480},
  doi          = {10.48550/ARXIV.2207.05480},
  eprinttype    = {arXiv},
  eprint       = {2207.05480},
  timestamp    = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-05480.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-07498,
  author       = {Ignacio Carlucho and
                  Arrasy Rahman and
                  William Ard and
                  Elliot Fosong and
                  Corina Barbalata and
                  Stefano V. Albrecht},
  title        = {Cooperative Marine Operations via Ad Hoc Teams},
  journal      = {CoRR},
  volume       = {abs/2207.07498},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.07498},
  doi          = {10.48550/ARXIV.2207.07498},
  eprinttype    = {arXiv},
  eprint       = {2207.07498},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-07498.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-09300,
  author       = {Elliot Fosong and
                  Arrasy Rahman and
                  Ignacio Carlucho and
                  Stefano V. Albrecht},
  title        = {Few-Shot Teamwork},
  journal      = {CoRR},
  volume       = {abs/2207.09300},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.09300},
  doi          = {10.48550/ARXIV.2207.09300},
  eprinttype    = {arXiv},
  eprint       = {2207.09300},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-09300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-14138,
  author       = {Arrasy Rahman and
                  Elliot Fosong and
                  Ignacio Carlucho and
                  Stefano V. Albrecht},
  title        = {Towards Robust Ad Hoc Teamwork Agents By Creating Diverse Training
                  Teammates},
  journal      = {CoRR},
  volume       = {abs/2207.14138},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.14138},
  doi          = {10.48550/ARXIV.2207.14138},
  eprinttype    = {arXiv},
  eprint       = {2207.14138},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-14138.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-00096,
  author       = {Majd Hawasly and
                  Jonathan Sadeghi and
                  Morris Antonello and
                  Stefano V. Albrecht and
                  John Redford and
                  Subramanian Ramamoorthy},
  title        = {Perspectives on the System-level Design of a Safe Autonomous Driving
                  Stack},
  journal      = {CoRR},
  volume       = {abs/2208.00096},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.00096},
  doi          = {10.48550/ARXIV.2208.00096},
  eprinttype    = {arXiv},
  eprint       = {2208.00096},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-00096.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-01769,
  author       = {Ibrahim H. Ahmed and
                  Cillian Brewitt and
                  Ignacio Carlucho and
                  Filippos Christianos and
                  Mhairi Dunion and
                  Elliot Fosong and
                  Samuel Garcin and
                  Shangmin Guo and
                  Balint Gyevnar and
                  Trevor McInroe and
                  Georgios Papoudakis and
                  Arrasy Rahman and
                  Lukas Sch{\"{a}}fer and
                  Massimiliano Tamborski and
                  Giuseppe Vecchio and
                  Cheng Wang and
                  Stefano V. Albrecht},
  title        = {Deep Reinforcement Learning for Multi-Agent Interaction},
  journal      = {CoRR},
  volume       = {abs/2208.01769},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.01769},
  doi          = {10.48550/ARXIV.2208.01769},
  eprinttype    = {arXiv},
  eprint       = {2208.01769},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-01769.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2209-14344,
  author       = {Filippos Christianos and
                  Georgios Papoudakis and
                  Stefano V. Albrecht},
  title        = {Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2209.14344},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.14344},
  doi          = {10.48550/ARXIV.2209.14344},
  eprinttype    = {arXiv},
  eprint       = {2209.14344},
  timestamp    = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-14344.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-05448,
  author       = {Arrasy Rahman and
                  Ignacio Carlucho and
                  Niklas H{\"{o}}pner and
                  Stefano V. Albrecht},
  title        = {A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based
                  Policy Learning},
  journal      = {CoRR},
  volume       = {abs/2210.05448},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.05448},
  doi          = {10.48550/ARXIV.2210.05448},
  eprinttype    = {arXiv},
  eprint       = {2210.05448},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-05448.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-06106,
  author       = {Anthony Knittel and
                  Majd Hawasly and
                  Stefano V. Albrecht and
                  John Redford and
                  Subramanian Ramamoorthy},
  title        = {{DiPA:} Diverse and Probabilistically Accurate Interactive Prediction},
  journal      = {CoRR},
  volume       = {abs/2210.06106},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.06106},
  doi          = {10.48550/ARXIV.2210.06106},
  eprinttype    = {arXiv},
  eprint       = {2210.06106},
  timestamp    = {Tue, 18 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-06106.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-14584,
  author       = {Filippos Christianos and
                  P{\'{e}}ter Karkus and
                  Boris Ivanovic and
                  Stefano V. Albrecht and
                  Marco Pavone},
  title        = {Planning with Occluded Traffic Agents using Bi-Level Variational Occlusion
                  Models},
  journal      = {CoRR},
  volume       = {abs/2210.14584},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.14584},
  doi          = {10.48550/ARXIV.2210.14584},
  eprinttype    = {arXiv},
  eprint       = {2210.14584},
  timestamp    = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-14584.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-11498,
  author       = {Aleksandar Krnjaic and
                  Jonathan D. Thomas and
                  Georgios Papoudakis and
                  Lukas Sch{\"{a}}fer and
                  Peter B{\"{o}}rsting and
                  Stefano V. Albrecht},
  title        = {Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics
                  with Robotic and Human Co-Workers},
  journal      = {CoRR},
  volume       = {abs/2212.11498},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.11498},
  doi          = {10.48550/ARXIV.2212.11498},
  eprinttype    = {arXiv},
  eprint       = {2212.11498},
  timestamp    = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-11498.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ChristianosPRA21,
  author       = {Filippos Christianos and
                  Georgios Papoudakis and
                  Arrasy Rahman and
                  Stefano V. Albrecht},
  editor       = {Marina Meila and
                  Tong Zhang},
  title        = {Scaling Multi-Agent Reinforcement Learning with Selective Parameter
                  Sharing},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {1989--1998},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/christianos21a.html},
  timestamp    = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChristianosPRA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/RahmanHCA21,
  author       = {Arrasy Rahman and
                  Niklas H{\"{o}}pner and
                  Filippos Christianos and
                  Stefano V. Albrecht},
  editor       = {Marina Meila and
                  Tong Zhang},
  title        = {Towards Open Ad Hoc Teamwork Using Graph-based Policy Learning},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {8776--8786},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/rahman21a.html},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RahmanHCA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/AlbrechtBWGEDR21,
  author       = {Stefano V. Albrecht and
                  Cillian Brewitt and
                  John Wilhelm and
                  Balint Gyevnar and
                  Francisco Eiras and
                  Mihai Dobre and
                  Subramanian Ramamoorthy},
  title        = {Interpretable Goal-based Prediction and Planning for Autonomous Driving},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {1043--1049},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9560849},
  doi          = {10.1109/ICRA48506.2021.9560849},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/AlbrechtBWGEDR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/BrewittGGA21,
  author       = {Cillian Brewitt and
                  Balint Gyevnar and
                  Samuel Garcin and
                  Stefano V. Albrecht},
  title        = {{GRIT:} Fast, Interpretable, and Verifiable Goal Recognition with
                  Learned Decision Trees for Autonomous Driving},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages        = {1023--1030},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636279},
  doi          = {10.1109/IROS51168.2021.9636279},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/BrewittGGA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/PulverECHAR21,
  author       = {Henry Pulver and
                  Francisco Eiras and
                  Ludovico Carozza and
                  Majd Hawasly and
                  Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {{PILOT:} Efficient Planning by Imitation Learning and Optimisation
                  for Safe Autonomous Driving},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages        = {1442--1449},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636862},
  doi          = {10.1109/IROS51168.2021.9636862},
  timestamp    = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/PulverECHAR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/HannaRFEDRRA21,
  author       = {Josiah P. Hanna and
                  Arrasy Rahman and
                  Elliot Fosong and
                  Francisco Eiras and
                  Mihai Dobre and
                  John Redford and
                  Subramanian Ramamoorthy and
                  Stefano V. Albrecht},
  title        = {Interpretable Goal Recognition in the Presence of Occluded Factors
                  for Autonomous Vehicles},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages        = {7044--7051},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9635903},
  doi          = {10.1109/IROS51168.2021.9635903},
  timestamp    = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/HannaRFEDRRA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/PapoudakisC0A21,
  author       = {Georgios Papoudakis and
                  Filippos Christianos and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  editor       = {Joaquin Vanschoren and
                  Sai{-}Kit Yeung},
  title        = {Benchmarking Multi-Agent Deep Reinforcement Learning Algorithms in
                  Cooperative Tasks},
  booktitle    = {Proceedings of the Neural Information Processing Systems Track on
                  Datasets and Benchmarks 1, NeurIPS Datasets and Benchmarks 2021, December
                  2021, virtual},
  year         = {2021},
  url          = {https://datasets-benchmarks-proceedings.neurips.cc/paper/2021/hash/a8baa56554f96369ab93e4f3bb068c22-Abstract-round1.html},
  timestamp    = {Thu, 05 May 2022 16:30:03 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PapoudakisC0A21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/PapoudakisCA21,
  author       = {Georgios Papoudakis and
                  Filippos Christianos and
                  Stefano V. Albrecht},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Agent Modelling under Partial Observability for Deep Reinforcement
                  Learning},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {19210--19222},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/a03caec56cd82478bf197475b48c05f9-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PapoudakisCA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/paams/AhmedHFA21,
  author       = {Ibrahim H. Ahmed and
                  Josiah P. Hanna and
                  Elliot Fosong and
                  Stefano V. Albrecht},
  editor       = {Frank Dignum and
                  Juan Manuel Corchado and
                  Fernando de la Prieta},
  title        = {Towards Quantum-Secure Authentication and Key Agreement via Abstract
                  Multi-Agent Interaction},
  booktitle    = {Advances in Practical Applications of Agents, Multi-Agent Systems,
                  and Social Good. The {PAAMS} Collection - 19th International Conference,
                  {PAAMS} 2021, Salamanca, Spain, October 6-8, 2021, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {12946},
  pages        = {14--26},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-030-85739-4_2},
  doi          = {10.1007/978-3-030-85739-4_2},
  timestamp    = {Tue, 28 Sep 2021 17:51:40 +0200},
  biburl       = {https://dblp.org/rec/conf/paams/AhmedHFA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-07475,
  author       = {Filippos Christianos and
                  Georgios Papoudakis and
                  Arrasy Rahman and
                  Stefano V. Albrecht},
  title        = {Scaling Multi-Agent Reinforcement Learning with Selective Parameter
                  Sharing},
  journal      = {CoRR},
  volume       = {abs/2102.07475},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.07475},
  eprinttype    = {arXiv},
  eprint       = {2102.07475},
  timestamp    = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-07475.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-06113,
  author       = {Cillian Brewitt and
                  Balint Gyevnar and
                  Stefano V. Albrecht},
  title        = {{GRIT:} Verifiable Goal Recognition for Autonomous Driving using Decision
                  Trees},
  journal      = {CoRR},
  volume       = {abs/2103.06113},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.06113},
  eprinttype    = {arXiv},
  eprint       = {2103.06113},
  timestamp    = {Tue, 16 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-06113.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-03982,
  author       = {Shangmin Guo and
                  Yi Ren and
                  Kory W. Mathewson and
                  Simon Kirby and
                  Stefano V. Albrecht and
                  Kenny Smith},
  title        = {Expressivity of Emergent Language is a Trade-off between Contextual
                  Complexity and Unpredictability},
  journal      = {CoRR},
  volume       = {abs/2106.03982},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.03982},
  eprinttype    = {arXiv},
  eprint       = {2106.03982},
  timestamp    = {Fri, 17 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-03982.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-08966,
  author       = {Lukas Sch{\"{a}}fer and
                  Filippos Christianos and
                  Josiah P. Hanna and
                  Stefano V. Albrecht},
  title        = {Decoupling Exploration and Exploitation in Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2107.08966},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.08966},
  eprinttype    = {arXiv},
  eprint       = {2107.08966},
  timestamp    = {Sun, 29 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-08966.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-02530,
  author       = {Josiah P. Hanna and
                  Arrasy Rahman and
                  Elliot Fosong and
                  Francisco Eiras and
                  Mihai Dobre and
                  John Redford and
                  Subramanian Ramamoorthy and
                  Stefano V. Albrecht},
  title        = {Interpretable Goal Recognition in the Presence of Occluded Factors
                  for Autonomous Vehicles},
  journal      = {CoRR},
  volume       = {abs/2108.02530},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.02530},
  eprinttype    = {arXiv},
  eprint       = {2108.02530},
  timestamp    = {Wed, 11 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-02530.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-04935,
  author       = {Trevor McInroe and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  title        = {Learning Temporally-Consistent Representations for Data-Efficient
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2110.04935},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.04935},
  eprinttype    = {arXiv},
  eprint       = {2110.04935},
  timestamp    = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-04935.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2111-14552,
  author       = {Rujie Zhong and
                  Josiah P. Hanna and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  title        = {Robust On-Policy Data Collection for Data-Efficient Policy Evaluation},
  journal      = {CoRR},
  volume       = {abs/2111.14552},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.14552},
  eprinttype    = {arXiv},
  eprint       = {2111.14552},
  timestamp    = {Wed, 01 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-14552.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/AlbrechtSW20,
  author       = {Stefano V. Albrecht and
                  Peter Stone and
                  Michael P. Wellman},
  title        = {Special issue on autonomous agents modelling other agents: Guest editorial},
  journal      = {Artif. Intell.},
  volume       = {285},
  pages        = {103292},
  year         = {2020},
  url          = {https://doi.org/10.1016/j.artint.2020.103292},
  doi          = {10.1016/J.ARTINT.2020.103292},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/AlbrechtSW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChristianosSA20,
  author       = {Filippos Christianos and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/7967cc8e3ab559e68cc944c44b1cf3e8-Abstract.html},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ChristianosSA20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-10829,
  author       = {Georgios Papoudakis and
                  Stefano V. Albrecht},
  title        = {Variational Autoencoders for Opponent Modeling in Multi-Agent Systems},
  journal      = {CoRR},
  volume       = {abs/2001.10829},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.10829},
  eprinttype    = {arXiv},
  eprint       = {2001.10829},
  timestamp    = {Thu, 30 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-10829.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02215,
  author       = {Francisco Eiras and
                  Majd Hawasly and
                  Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {A Two-Stage Optimization Approach to Safe-by-Design Planning for Autonomous
                  Driving},
  journal      = {CoRR},
  volume       = {abs/2002.02215},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02215},
  eprinttype    = {arXiv},
  eprint       = {2002.02215},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02215.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02277,
  author       = {Stefano V. Albrecht and
                  Cillian Brewitt and
                  John Wilhelm and
                  Francisco Eiras and
                  Mihai Dobre and
                  Subramanian Ramamoorthy},
  title        = {Integrating Planning and Interpretable Goal Recognition for Autonomous
                  Driving},
  journal      = {CoRR},
  volume       = {abs/2002.02277},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02277},
  eprinttype    = {arXiv},
  eprint       = {2002.02277},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02277.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-07169,
  author       = {Filippos Christianos and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  title        = {Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2006.07169},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.07169},
  eprinttype    = {arXiv},
  eprint       = {2006.07169},
  timestamp    = {Sun, 29 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-07169.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-07869,
  author       = {Georgios Papoudakis and
                  Filippos Christianos and
                  Lukas Sch{\"{a}}fer and
                  Stefano V. Albrecht},
  title        = {Comparative Evaluation of Multi-Agent Deep Reinforcement Learning
                  Algorithms},
  journal      = {CoRR},
  volume       = {abs/2006.07869},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.07869},
  eprinttype    = {arXiv},
  eprint       = {2006.07869},
  timestamp    = {Sun, 29 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-07869.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-09447,
  author       = {Georgios Papoudakis and
                  Filippos Christianos and
                  Stefano V. Albrecht},
  title        = {Opponent Modelling with Local Information Variational Autoencoders},
  journal      = {CoRR},
  volume       = {abs/2006.09447},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.09447},
  eprinttype    = {arXiv},
  eprint       = {2006.09447},
  timestamp    = {Tue, 23 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-09447.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-10412,
  author       = {Arrasy Rahman and
                  Niklas H{\"{o}}pner and
                  Filippos Christianos and
                  Stefano V. Albrecht},
  title        = {Open Ad Hoc Teamwork using Graph-based Policy Learning},
  journal      = {CoRR},
  volume       = {abs/2006.10412},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.10412},
  eprinttype    = {arXiv},
  eprint       = {2006.10412},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-10412.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-09327,
  author       = {Ibrahim H. Ahmed and
                  Josiah P. Hanna and
                  Stefano V. Albrecht},
  title        = {Quantum-Secure Authentication via Abstract Multi-Agent Interaction},
  journal      = {CoRR},
  volume       = {abs/2007.09327},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.09327},
  eprinttype    = {arXiv},
  eprint       = {2007.09327},
  timestamp    = {Fri, 31 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-09327.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-00509,
  author       = {Henry Pulver and
                  Francisco Eiras and
                  Ludovico Carozza and
                  Majd Hawasly and
                  Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {{PILOT:} Efficient Planning by Imitation Learning and Optimisation
                  for Safe Autonomous Driving},
  journal      = {CoRR},
  volume       = {abs/2011.00509},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.00509},
  eprinttype    = {arXiv},
  eprint       = {2011.00509},
  timestamp    = {Fri, 06 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-00509.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.04737, indexed by DBLP under CoRR (2019).
@article{DBLP:journals/corr/abs-1906-04737,
  author       = {Georgios Papoudakis and
                  Filippos Christianos and
                  Arrasy Rahman and
                  Stefano V. Albrecht},
  title        = {Dealing with Non-Stationarity in Multi-Agent Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1906.04737},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.04737},
  eprinttype    = {arXiv},
  eprint       = {1906.04737},
  timestamp    = {Fri, 14 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-04737.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.11064, indexed by DBLP under CoRR (2019).
% Same title and authors as DBLP:conf/atal/AlbrechtS17 in this file; presumably
% the preprint of that paper (confirm before citing both).
@article{DBLP:journals/corr/abs-1906-11064,
  author       = {Stefano V. Albrecht and
                  Peter Stone},
  title        = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  journal      = {CoRR},
  volume       = {abs/1906.11064},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.11064},
  eprinttype    = {arXiv},
  eprint       = {1906.11064},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-11064.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.01912, indexed by DBLP under CoRR (2019).
% Same title and authors as DBLP:conf/uai/AlbrechtR15 in this file; presumably
% the preprint of that paper (confirm before citing both).
@article{DBLP:journals/corr/abs-1907-01912,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {Are You Doing What {I} Think You Are Doing? Criticising Uncertain
                  Agent Models},
  journal      = {CoRR},
  volume       = {abs/1907.01912},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.01912},
  eprinttype    = {arXiv},
  eprint       = {1907.01912},
  timestamp    = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-01912.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.05247, indexed by DBLP under CoRR (2019).
% Same title as DBLP:conf/aaai/AlbrechtCR15 in this file; presumably the
% preprint of that paper (confirm before citing both).
@article{DBLP:journals/corr/abs-1907-05247,
  author       = {Stefano V. Albrecht and
                  Jacob W. Crandall and
                  Subramanian Ramamoorthy},
  title        = {An Empirical Study on the Practical Impact of Prior Beliefs over Policy
                  Types},
  journal      = {CoRR},
  volume       = {abs/1907.05247},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.05247},
  eprinttype    = {arXiv},
  eprint       = {1907.05247},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-05247.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.05850, indexed by DBLP under CoRR (2019).
% Same title and authors as DBLP:conf/ijcai/AlbrechtR17 in this file; presumably
% the preprint of that extended abstract (confirm before citing both).
% "Bayesian" is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-1907-05850,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {Exploiting Causality for Selective Belief Filtering in Dynamic {Bayesian}
                  Networks (Extended Abstract)},
  journal      = {CoRR},
  volume       = {abs/1907.05850},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.05850},
  eprinttype    = {arXiv},
  eprint       = {1907.05850},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-05850.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.06995, indexed by DBLP under CoRR (2019).
% Same title and authors as DBLP:conf/uai/AlbrechtR14 in this file; presumably
% the preprint of that paper (confirm before citing both).
@article{DBLP:journals/corr/abs-1907-06995,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {On Convergence and Optimality of Best-Response Learning with Policy
                  Types in Multiagent Systems},
  journal      = {CoRR},
  volume       = {abs/1907.06995},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.06995},
  eprinttype    = {arXiv},
  eprint       = {1907.06995},
  timestamp    = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-06995.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.09189, indexed by DBLP under CoRR (2019).
% NOTE(review): the title closely matches DBLP:conf/aamas/AlbrechtR12 in this
% file (which writes "MAL" for "Multiagent Learning"); presumably the same
% work, confirm before citing both.
@article{DBLP:journals/corr/abs-1907-09189,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {Comparative Evaluation of Multiagent Learning Algorithms in a Diverse
                  Set of Ad Hoc Team Problems},
  journal      = {CoRR},
  volume       = {abs/1907.09189},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.09189},
  eprinttype    = {arXiv},
  eprint       = {1907.09189},
  timestamp    = {Tue, 30 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-09189.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.09810, indexed by DBLP under CoRR (2019).
@article{DBLP:journals/corr/abs-1907-09810,
  author       = {Stefano V. Albrecht and
                  Jacob W. Crandall and
                  Subramanian Ramamoorthy},
  title        = {{E-HBA:} Using Action Policies for Expert Advice and Agent Typification},
  journal      = {CoRR},
  volume       = {abs/1907.09810},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.09810},
  eprinttype    = {arXiv},
  eprint       = {1907.09810},
  timestamp    = {Tue, 30 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-09810.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1910.00927, indexed by DBLP under CoRR (2019).
@article{DBLP:journals/corr/abs-1910-00927,
  author       = {Maciej Wiatrak and
                  Stefano V. Albrecht},
  title        = {Stabilizing Generative Adversarial Network Training: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/1910.00927},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.00927},
  eprinttype    = {arXiv},
  eprint       = {1910.00927},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-00927.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Artif. Intell. 258 (2018), pp. 66--95.
% Same title and authors as the arXiv record DBLP:journals/corr/abs-1709-08071
% in this file; presumably the published version of that preprint.
@article{DBLP:journals/ai/AlbrechtS18,
  author       = {Stefano V. Albrecht and
                  Peter Stone},
  title        = {Autonomous agents modelling other agents: {A} comprehensive survey
                  and open problems},
  journal      = {Artif. Intell.},
  volume       = {258},
  pages        = {66--95},
  year         = {2018},
  url          = {https://doi.org/10.1016/j.artint.2018.01.002},
  doi          = {10.1016/J.ARTINT.2018.01.002},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/AlbrechtS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1801.03331, indexed by DBLP under CoRR (2018).
@article{DBLP:journals/corr/abs-1801-03331,
  author       = {Craig Innes and
                  Alex Lascarides and
                  Stefano V. Albrecht and
                  Subramanian Ramamoorthy and
                  Benjamin Rosman},
  title        = {Reasoning about Unforeseen Possibilities During Policy Learning},
  journal      = {CoRR},
  volume       = {abs/1801.03331},
  year         = {2018},
  url          = {https://arxiv.org/abs/1801.03331},
  eprinttype    = {arXiv},
  eprint       = {1801.03331},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-03331.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Guest editorial for a journal special issue:
% Auton. Agents Multi Agent Syst. 31(4), 2017, pp. 765--766.
@article{DBLP:journals/aamas/AlbrechtLS17,
  author       = {Stefano V. Albrecht and
                  Somchaya Liemhetcharat and
                  Peter Stone},
  title        = {Special issue on multiagent interaction without prior coordination:
                  guest editorial},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {31},
  number       = {4},
  pages        = {765--766},
  year         = {2017},
  url          = {https://doi.org/10.1007/s10458-016-9358-0},
  doi          = {10.1007/S10458-016-9358-0},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aamas/AlbrechtLS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAMAS 2017, pp. 547--555.
% An arXiv record with the same title and authors is listed in this file as
% DBLP:journals/corr/abs-1906-11064.
@inproceedings{DBLP:conf/atal/AlbrechtS17,
  author       = {Stefano V. Albrecht and
                  Peter Stone},
  editor       = {Kate Larson and
                  Michael Winikoff and
                  Sanmay Das and
                  Edmund H. Durfee},
  title        = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  booktitle    = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent
                  Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages        = {547--555},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {http://dl.acm.org/citation.cfm?id=3091206},
  timestamp    = {Wed, 27 Sep 2017 07:24:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AlbrechtS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (extended abstract), IJCAI 2017, pp. 5085--5089.
% "Bayesian" is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/ijcai/AlbrechtR17,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Carles Sierra},
  title        = {Exploiting Causality for Selective Belief Filtering in Dynamic {Bayesian}
                  Networks (Extended Abstract)},
  booktitle    = {Proceedings of the Twenty-Sixth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August
                  19-25, 2017},
  pages        = {5085--5089},
  publisher    = {ijcai.org},
  year         = {2017},
  url          = {https://doi.org/10.24963/ijcai.2017/727},
  doi          = {10.24963/IJCAI.2017/727},
  timestamp    = {Tue, 20 Aug 2019 16:16:54 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/AlbrechtR17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1709.08071, indexed by DBLP under CoRR (2017).
% Same title and authors as DBLP:journals/ai/AlbrechtS18 in this file;
% presumably the preprint of that article (confirm before citing both).
@article{DBLP:journals/corr/abs-1709-08071,
  author       = {Stefano V. Albrecht and
                  Peter Stone},
  title        = {Autonomous Agents Modelling Other Agents: {A} Comprehensive Survey
                  and Open Problems},
  journal      = {CoRR},
  volume       = {abs/1709.08071},
  year         = {2017},
  url          = {https://arxiv.org/abs/1709.08071},
  eprinttype    = {arXiv},
  eprint       = {1709.08071},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-08071.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Artif. Intell. 235 (2016), pp. 63--94.
% Same title and authors as the arXiv record DBLP:journals/corr/AlbrechtCR15
% in this file; presumably the published version of that preprint.
@article{DBLP:journals/ai/AlbrechtCR16,
  author       = {Stefano V. Albrecht and
                  Jacob W. Crandall and
                  Subramanian Ramamoorthy},
  title        = {Belief and truth in hypothesised behaviours},
  journal      = {Artif. Intell.},
  volume       = {235},
  pages        = {63--94},
  year         = {2016},
  url          = {https://doi.org/10.1016/j.artint.2016.02.004},
  doi          = {10.1016/J.ARTINT.2016.02.004},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/AlbrechtCR16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Multi-author workshop report: AI Mag. 37(3), 2016, pp. 99--108.
% Hruschka is entered in the "Last, Jr., First" form; written as
% "Estevam R. Hruschka Jr." BibTeX would take "Jr." as the surname.
@article{DBLP:journals/aim/AlbrechtBBBCCDF16,
  author       = {Stefano V. Albrecht and
                  Bruno Bouchard and
                  John S. Brownstein and
                  David L. Buckeridge and
                  Cornelia Caragea and
                  Kevin M. Carter and
                  Adnan Darwiche and
                  Blaz Fortuna and
                  Yannick Francillette and
                  S{\'{e}}bastien Gaboury and
                  C. Lee Giles and
                  Marko Grobelnik and
                  Hruschka, Jr., Estevam R. and
                  Jeffrey O. Kephart and
                  Parisa Kordjamshidi and
                  Viliam Lis{\'{y}} and
                  Daniele Magazzeni and
                  Jo{\~{a}}o Marques{-}Silva and
                  Pierre Marquis and
                  David R. Martinez and
                  Marek P. Michalowski and
                  Arash Shaban{-}Nejad and
                  Zeinab Noorian and
                  Enrico Pontelli and
                  Alex Rogers and
                  Stephanie Rosenthal and
                  Dan Roth and
                  Arunesh Sinha and
                  William W. Streilein and
                  Sylvie Thi{\'{e}}baux and
                  Tran Cao Son and
                  Byron C. Wallace and
                  Toby Walsh and
                  Michael Witbrock and
                  Jie Zhang},
  title        = {Reports of the 2016 {AAAI} Workshop Program},
  journal      = {{AI} Mag.},
  volume       = {37},
  number       = {3},
  pages        = {99--108},
  year         = {2016},
  url          = {https://doi.org/10.1609/aimag.v37i3.2680},
  doi          = {10.1609/AIMAG.V37I3.2680},
  timestamp    = {Tue, 18 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/AlbrechtBBBCCDF16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Artif. Intell. Res. 55 (2016), pp. 1135--1178.
% "Bayesian" is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/jair/AlbrechtR16,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {Exploiting Causality for Selective Belief Filtering in Dynamic {Bayesian}
                  Networks},
  journal      = {J. Artif. Intell. Res.},
  volume       = {55},
  pages        = {1135--1178},
  year         = {2016},
  url          = {https://doi.org/10.1613/jair.5044},
  doi          = {10.1613/JAIR.5044},
  timestamp    = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/AlbrechtR16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop proceedings volume (AAAI Technical Report WS-16-11), 2016.
% This is an edited volume: it carries an editor field and no author field.
@proceedings{DBLP:conf/aaai/2016ma,
  editor       = {Stefano V. Albrecht and
                  Katie Genter and
                  Somchaya Liemhetcharat},
  title        = {Multiagent Interaction without Prior Coordination, Papers from the
                  2016 {AAAI} Workshop, Phoenix, Arizona, USA, February 13, 2016},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-16-11}},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {http://www.aaai.org/Library/Workshops/ws16-11.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/2016ma.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% PhD thesis, University of Edinburgh, 2015; the url points to an EThOS record.
% NOTE(review): not checked whether the EThOS link still resolves.
@phdthesis{DBLP:phd/ethos/Albrecht15,
  author       = {Stefano Vittorino Albrecht},
  title        = {Utilising policy types for effective ad hoc coordination in multiagent
                  systems},
  school       = {University of Edinburgh, {UK}},
  year         = {2015},
  url          = {https://ethos.bl.uk/OrderDetails.do?uin=uk.bl.ethos.693660},
  timestamp    = {Wed, 04 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/ethos/Albrecht15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Multi-author workshop report: AI Mag. 36(1), 2015, pp. 87--98.
% "Van den Broeck" is entered as a braced surname in "Last, First" form;
% written as "Guy Van den Broeck" BibTeX would split it into
% First = "Guy Van", von = "den", Last = "Broeck".
@article{DBLP:journals/aim/AlbrechtBBBCDEF15,
  author       = {Stefano V. Albrecht and
                  Andr{\'{e}} da Motta Salles Barreto and
                  Darius Braziunas and
                  David L. Buckeridge and
                  Heriberto Cuay{\'{a}}huitl and
                  Nina Dethlefs and
                  Markus Endres and
                  Amir{-}massoud Farahmand and
                  Mark Fox and
                  Lutz Frommberger and
                  Sam Ganzfried and
                  Yolanda Gil and
                  S{\'{e}}bastien Guillet and
                  Lawrence E. Hunter and
                  Arnav Jhala and
                  Kristian Kersting and
                  George Dimitri Konidaris and
                  Freddy L{\'{e}}cu{\'{e}} and
                  Sheila A. McIlraith and
                  Sriraam Natarajan and
                  Zeinab Noorian and
                  David Poole and
                  R{\'{e}}mi Ronfard and
                  Alessandro Saffiotti and
                  Arash Shaban{-}Nejad and
                  Biplav Srivastava and
                  Gerald Tesauro and
                  Rosario Uceda{-}Sosa and
                  {Van den Broeck}, Guy and
                  Martijn van Otterlo and
                  Byron C. Wallace and
                  Paul Weng and
                  Jenna Wiens and
                  Jie Zhang},
  title        = {Reports of the {AAAI} 2014 Conference Workshops},
  journal      = {{AI} Mag.},
  volume       = {36},
  number       = {1},
  pages        = {87--98},
  year         = {2015},
  url          = {https://doi.org/10.1609/aimag.v36i1.2575},
  doi          = {10.1609/AIMAG.V36I1.2575},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/AlbrechtBBBCDEF15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, Twenty-Ninth AAAI Conference (2015), pp. 1988--1994.
% Author names are spelled out in full here ("Stefano Vittorino Albrecht",
% "Jacob William Crandall"), unlike the initial-only forms used by most other
% records in this file.
@inproceedings{DBLP:conf/aaai/AlbrechtCR15,
  author       = {Stefano Vittorino Albrecht and
                  Jacob William Crandall and
                  Subramanian Ramamoorthy},
  editor       = {Blai Bonet and
                  Sven Koenig},
  title        = {An Empirical Study on the Practical Impact of Prior Beliefs over Policy
                  Types},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {1988--1994},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9426},
  doi          = {10.1609/AAAI.V29I1.9426},
  timestamp    = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AlbrechtCR15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, UAI 2015, pp. 52--61.
% The record has no doi field; the url is a direct link to a PDF on auai.org.
@inproceedings{DBLP:conf/uai/AlbrechtR15,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Marina Meila and
                  Tom Heskes},
  title        = {Are You Doing What {I} Think You Are Doing? Criticising Uncertain
                  Agent Models},
  booktitle    = {Proceedings of the Thirty-First Conference on Uncertainty in Artificial
                  Intelligence, {UAI} 2015, July 12-16, 2015, Amsterdam, The Netherlands},
  pages        = {52--61},
  publisher    = {{AUAI} Press},
  year         = {2015},
  url          = {http://auai.org/uai2015/proceedings/papers/37.pdf},
  timestamp    = {Thu, 12 Mar 2020 11:31:09 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/AlbrechtR15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Multi-author workshop report: AI Mag. 36(2), 2015, pp. 90--101.
@article{DBLP:journals/aim/AlbrechtLBBCCDD15,
  author       = {Stefano V. Albrecht and
                  J. Christopher Beck and
                  David L. Buckeridge and
                  Adi Botea and
                  Cornelia Caragea and
                  Chi{-}Hung Chi and
                  Theodoros Damoulas and
                  Bistra Dilkina and
                  Eric Eaton and
                  Pooyan Fazli and
                  Sam Ganzfried and
                  Marius Lindauer and
                  Marlos C. Machado and
                  Yuri Malitsky and
                  Gary Marcus and
                  Sebastiaan A. Meijer and
                  Francesca Rossi and
                  Arash Shaban{-}Nejad and
                  Sylvie Thi{\'{e}}baux and
                  Manuela M. Veloso and
                  Toby Walsh and
                  Can Wang and
                  Jie Zhang and
                  Yu Zheng},
  title        = {Reports from the 2015 {AAAI} Workshop Program},
  journal      = {{AI} Mag.},
  volume       = {36},
  number       = {2},
  pages        = {90--101},
  year         = {2015},
  url          = {https://doi.org/10.1609/aimag.v36i2.2590},
  doi          = {10.1609/AIMAG.V36I2.2590},
  timestamp    = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aim/AlbrechtLBBCCDD15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1506.01170, indexed by DBLP under CoRR (2015).
% Same title and authors as DBLP:conf/atal/AlbrechtR13 in this file;
% presumably a version of that paper (confirm before citing both).
@article{DBLP:journals/corr/AlbrechtR15,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {A Game-Theoretic Model and Best-Response Learning Method for Ad Hoc
                  Coordination in Multiagent Systems},
  journal      = {CoRR},
  volume       = {abs/1506.01170},
  year         = {2015},
  url          = {https://arxiv.org/abs/1506.01170},
  eprinttype    = {arXiv},
  eprint       = {1506.01170},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlbrechtR15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1507.07688, indexed by DBLP under CoRR (2015).
% Same title and authors as DBLP:journals/ai/AlbrechtCR16 in this file;
% presumably the preprint of that article (confirm before citing both).
@article{DBLP:journals/corr/AlbrechtCR15,
  author       = {Stefano V. Albrecht and
                  Jacob W. Crandall and
                  Subramanian Ramamoorthy},
  title        = {Belief and Truth in Hypothesised Behaviours},
  journal      = {CoRR},
  volume       = {abs/1507.07688},
  year         = {2015},
  url          = {https://arxiv.org/abs/1507.07688},
  eprinttype    = {arXiv},
  eprint       = {1507.07688},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlbrechtCR15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, UAI 2014, pp. 12--21.
% The url query string uses plain escaped ampersands between parameters
% (mmnu, smnu, article_id, proceeding_id).
% NOTE(review): not checked whether the dslpitt.org link still resolves.
@inproceedings{DBLP:conf/uai/AlbrechtR14,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Nevin L. Zhang and
                  Jin Tian},
  title        = {On Convergence and Optimality of Best-Response Learning with Policy
                  Types in Multiagent Systems},
  booktitle    = {Proceedings of the Thirtieth Conference on Uncertainty in Artificial
                  Intelligence, {UAI} 2014, Quebec City, Quebec, Canada, July 23-27,
                  2014},
  pages        = {12--21},
  publisher    = {{AUAI} Press},
  year         = {2014},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=2436\&proceeding\_id=30},
  timestamp    = {Wed, 03 Feb 2021 11:09:27 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/AlbrechtR14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1401.7941, indexed by DBLP under CoRR (2014).
% "POMDPs" is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/AlbrechtR14,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  title        = {Exploiting Causality for Efficient Monitoring in {POMDPs}},
  journal      = {CoRR},
  volume       = {abs/1401.7941},
  year         = {2014},
  url          = {https://arxiv.org/abs/1401.7941},
  eprinttype    = {arXiv},
  eprint       = {1401.7941},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlbrechtR14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAMAS '13, pp. 1155--1156.
% An arXiv record with the same title and authors is listed in this file as
% DBLP:journals/corr/AlbrechtR15.
@inproceedings{DBLP:conf/atal/AlbrechtR13,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {A game-theoretic model and best-response learning method for ad hoc
                  coordination in multiagent systems},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {1155--1156},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485118},
  timestamp    = {Thu, 09 Sep 2021 16:09:54 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AlbrechtR13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAMAS '13, pp. 1415--1416.
% Second record by the same authors in the same proceedings as
% DBLP:conf/atal/AlbrechtR13 (hence the "a" key suffix).
@inproceedings{DBLP:conf/atal/AlbrechtR13a,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {Ad hoc coordination in multiagent systems with applications to human-machine
                  interaction},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {1415--1416},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485253},
  timestamp    = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AlbrechtR13a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAMAS 2012, pp. 349--356.
% NOTE(review): this key and biburl use the "conf/aamas" prefix, whereas the
% AAMAS 2013 and 2017 records in this file use "conf/atal"; verify the key
% against DBLP before relying on it.
@inproceedings{DBLP:conf/aamas/AlbrechtR12,
  author       = {Stefano V. Albrecht and
                  Subramanian Ramamoorthy},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {Comparative evaluation of {MAL} algorithms in a diverse set of ad
                  hoc team problems},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {349--356},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343626},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/AlbrechtR12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics