BibTeX records: Joelle Pineau

download as .bib file

% CSLAW 2024 symposium paper, published by ACM.
@inproceedings{DBLP:conf/cslaw/0002HDP24,
  author       = {Henderson, Peter and
                  Hu, Jieru and
                  Diab, Mona T. and
                  Pineau, Joelle},
  title        = {Rethinking Machine Learning Benchmarks in the Context of
                  Professional Codes of Conduct},
  booktitle    = {Proceedings of the Symposium on Computer Science and Law,
                  {CSLAW} 2024, Boston, MA, USA, March 12-13, 2024},
  pages        = {109--120},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3614407.3643708},
  doi          = {10.1145/3614407.3643708},
  timestamp    = {Mon, 15 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cslaw/0002HDP24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; the record links to OpenReview and carries no doi field.
@inproceedings{DBLP:conf/iclr/WabarthaP24,
  author       = {Wabartha, Maxime and
                  Pineau, Joelle},
  title        = {Piecewise Linear Parametrization of Policies: Towards
                  Interpretable Deep Reinforcement Learning},
  booktitle    = {The Twelfth International Conference on Learning
                  Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=hOMVq57Ce0},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WabarthaP24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2024 position paper. DBLP:journals/corr/abs-2403-07918 lists the same
% authors and the same title minus the "Position:" prefix (presumably its preprint).
@inproceedings{DBLP:conf/icml/KapoorBKLRCHBBB24,
  author       = {Kapoor, Sayash and
                  Bommasani, Rishi and
                  Klyman, Kevin and
                  Longpre, Shayne and
                  Ramaswami, Ashwin and
                  Cihon, Peter and
                  Hopkins, Aspen K. and
                  Bankston, Kevin and
                  Biderman, Stella and
                  Bogen, Miranda and
                  Chowdhury, Rumman and
                  Engler, Alex and
                  Henderson, Peter and
                  Jernite, Yacine and
                  Lazar, Seth and
                  Maffulli, Stefano and
                  Nelson, Alondra and
                  Pineau, Joelle and
                  Skowron, Aviya and
                  Song, Dawn and
                  Storchan, Victor and
                  Zhang, Daniel and
                  Ho, Daniel E. and
                  Liang, Percy and
                  Narayanan, Arvind},
  title        = {Position: On the Societal Impact of Open Foundation Models},
  booktitle    = {Forty-first International Conference on Machine Learning,
                  {ICML} 2024, Vienna, Austria, July 21-27, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=jRX6yCxFhx},
  timestamp    = {Mon, 02 Sep 2024 16:45:29 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KapoorBKLRCHBBB24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2403.07918. DBLP:conf/icml/KapoorBKLRCHBBB24 lists the same
% authors with a "Position:" title prefix (presumably the published version).
@article{DBLP:journals/corr/abs-2403-07918,
  author       = {Kapoor, Sayash and
                  Bommasani, Rishi and
                  Klyman, Kevin and
                  Longpre, Shayne and
                  Ramaswami, Ashwin and
                  Cihon, Peter and
                  Hopkins, Aspen K. and
                  Bankston, Kevin and
                  Biderman, Stella and
                  Bogen, Miranda and
                  Chowdhury, Rumman and
                  Engler, Alex and
                  Henderson, Peter and
                  Jernite, Yacine and
                  Lazar, Seth and
                  Maffulli, Stefano and
                  Nelson, Alondra and
                  Pineau, Joelle and
                  Skowron, Aviya and
                  Song, Dawn and
                  Storchan, Victor and
                  Zhang, Daniel and
                  Ho, Daniel E. and
                  Liang, Percy and
                  Narayanan, Arvind},
  title        = {On the Societal Impact of Open Foundation Models},
  journal      = {CoRR},
  volume       = {abs/2403.07918},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.07918},
  doi          = {10.48550/ARXIV.2403.07918},
  eprinttype   = {arXiv},
  eprint       = {2403.07918},
  timestamp    = {Thu, 29 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-07918.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Eur. J. Oper. Res. 304(2), 2023). DBLP:journals/corr/abs-2203-00097
% is the arXiv record with the same title and authors.
@article{DBLP:journals/eor/CousineauVMP23,
  author       = {Cousineau, Martin and
                  Verter, Vedat and
                  Murphy, Susan A. and
                  Pineau, Joelle},
  title        = {Estimating causal effects with optimization-based methods:
                  {A} review and empirical comparison},
  journal      = {Eur. J. Oper. Res.},
  volume       = {304},
  number       = {2},
  pages        = {367--380},
  year         = {2023},
  url          = {https://doi.org/10.1016/j.ejor.2022.01.046},
  doi          = {10.1016/J.EJOR.2022.01.046},
  timestamp    = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/eor/CousineauVMP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Publisher correction notice; the title points at the article recorded as
% DBLP:journals/natmi/SrikumarFAACCHJLOP22. Journal abbreviation uses "Mach.",
% matching the other "Machine" journal abbreviations in this file.
@article{DBLP:journals/natmi/SrikumarFAACCHJLOP23,
  author       = {Srikumar, Madhulika and
                  Finlay, Rebecca and
                  Abuhamad, Grace and
                  Ashurst, Carolyn and
                  Campbell, Rosie and
                  Campbell{-}Ratcliffe, Emily and
                  Hongo, Hudson and
                  Jordan, Sara R. and
                  Lindley, Joseph and
                  Ovadya, Aviv and
                  Pineau, Joelle},
  title        = {Publisher Correction: Advancing ethics review practices in {AI} research},
  journal      = {Nat. Mach. Intell.},
  volume       = {5},
  number       = {1},
  pages        = {94},
  year         = {2023},
  url          = {https://doi.org/10.1038/s42256-023-00608-6},
  doi          = {10.1038/S42256-023-00608-6},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/natmi/SrikumarFAACCHJLOP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% TACL journal article (vol. 11, 2023). doi/url are stored without TeX escapes
% so that verbatim/url-aware styles produce a working link.
% DBLP:journals/corr/abs-2206-10658 is the arXiv record with the same title and authors.
@article{DBLP:journals/tacl/SachanLYZPZ23,
  author       = {Sachan, Devendra Singh and
                  Lewis, Mike and
                  Yogatama, Dani and
                  Zettlemoyer, Luke and
                  Pineau, Joelle and
                  Zaheer, Manzil},
  title        = {Questions Are All You Need to Train a Dense Passage Retriever},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {11},
  pages        = {600--616},
  year         = {2023},
  url          = {https://doi.org/10.1162/tacl_a_00564},
  doi          = {10.1162/TACL_A_00564},
  timestamp    = {Wed, 19 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/SachanLYZPZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% TMLR article (2023); the record links to OpenReview and carries no doi field.
@article{DBLP:journals/tmlr/SatijaLPP23,
  author       = {Satija, Harsh and
                  Lazaric, Alessandro and
                  Pirotta, Matteo and
                  Pineau, Joelle},
  title        = {Group Fairness in Reinforcement Learning},
  journal      = {Trans. Mach. Learn. Res.},
  volume       = {2023},
  year         = {2023},
  url          = {https://openreview.net/forum?id=JkIH4MeOc3},
  timestamp    = {Thu, 18 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/SatijaLPP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Int. J. Artif. Intell. Educ. 32(2), 2022).
@article{DBLP:journals/aiedu/KochmarVBGSP22,
  author       = {Kochmar, Ekaterina and
                  Vu, Dung Do and
                  Belfer, Robert and
                  Gupta, Varun and
                  Serban, Iulian Vlad and
                  Pineau, Joelle},
  title        = {Automated Data-Driven Generation of Personalized Pedagogical
                  Interventions in Intelligent Tutoring Systems},
  journal      = {Int. J. Artif. Intell. Educ.},
  volume       = {32},
  number       = {2},
  pages        = {323--349},
  year         = {2022},
  url          = {https://doi.org/10.1007/s40593-021-00267-x},
  doi          = {10.1007/S40593-021-00267-X},
  timestamp    = {Mon, 08 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aiedu/KochmarVBGSP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (J. Artif. Intell. Res. 75, 2022).
@article{DBLP:journals/jair/MazoureDLMPPR22,
  author       = {Mazoure, Bogdan and
                  Doan, Thang and
                  Li, Tianyu and
                  Makarenkov, Vladimir and
                  Pineau, Joelle and
                  Precup, Doina and
                  Rabusseau, Guillaume},
  title        = {Low-Rank Representation of Reinforcement Learning Policies},
  journal      = {J. Artif. Intell. Res.},
  volume       = {75},
  pages        = {597--636},
  year         = {2022},
  url          = {https://doi.org/10.1613/jair.1.13854},
  doi          = {10.1613/JAIR.1.13854},
  timestamp    = {Sat, 05 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/MazoureDLMPPR22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (vol. 4, no. 12, 2022). DBLP:journals/natmi/SrikumarFAACCHJLOP23
% is titled as a publisher correction to it. Journal abbreviation uses "Mach.",
% matching the other "Machine" journal abbreviations in this file.
@article{DBLP:journals/natmi/SrikumarFAACCHJLOP22,
  author       = {Srikumar, Madhulika and
                  Finlay, Rebecca and
                  Abuhamad, Grace and
                  Ashurst, Carolyn and
                  Campbell, Rosie and
                  Campbell{-}Ratcliffe, Emily and
                  Hongo, Hudson and
                  Jordan, Sara R. and
                  Lindley, Joseph and
                  Ovadya, Aviv and
                  Pineau, Joelle},
  title        = {Advancing ethics review practices in {AI} research},
  journal      = {Nat. Mach. Intell.},
  volume       = {4},
  number       = {12},
  pages        = {1061--1064},
  year         = {2022},
  url          = {https://doi.org/10.1038/s42256-022-00585-2},
  doi          = {10.1038/S42256-022-00585-2},
  timestamp    = {Wed, 17 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/natmi/SrikumarFAACCHJLOP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2022 paper. DBLP:journals/corr/abs-2201-01836 is the arXiv record with
% the same title and authors.
@inproceedings{DBLP:conf/aaai/GX-ChenCRP22,
  author       = {GX{-}Chen, Anthony and
                  Chelu, Veronica and
                  Richards, Blake A. and
                  Pineau, Joelle},
  title        = {A Generalized Bootstrap Target for Value-Learning, Efficiently
                  Combining Value and Feature Predictions},
  booktitle    = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI} 2022,
                  Thirty-Fourth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2022, Virtual Event,
                  February 22 - March 1, 2022},
  pages        = {6829--6837},
  publisher    = {{AAAI} Press},
  year         = {2022},
  url          = {https://doi.org/10.1609/aaai.v36i6.20639},
  doi          = {10.1609/AAAI.V36I6.20639},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GX-ChenCRP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2022 main-conference paper. DBLP:journals/corr/abs-2204-07496 is the
% arXiv record with the same title and authors.
@inproceedings{DBLP:conf/emnlp/SachanLJAYPZ22,
  author       = {Sachan, Devendra Singh and
                  Lewis, Mike and
                  Joshi, Mandar and
                  Aghajanyan, Armen and
                  Yih, Wen{-}tau and
                  Pineau, Joelle and
                  Zettlemoyer, Luke},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {Improving Passage Retrieval with Zero-Shot Question Generation},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in
                  Natural Language Processing, {EMNLP} 2022, Abu Dhabi,
                  United Arab Emirates, December 7-11, 2022},
  pages        = {3781--3797},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.249},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.249},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SachanLJAYPZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of EMNLP 2022 paper. DBLP:journals/corr/abs-2210-12574 is the arXiv
% record with the same title and authors.
@inproceedings{DBLP:conf/emnlp/SinhaKRPHW22,
  author       = {Sinha, Koustuv and
                  Kazemnejad, Amirhossein and
                  Reddy, Siva and
                  Pineau, Joelle and
                  Hupkes, Dieuwke and
                  Williams, Adina},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {The Curious Case of Absolute Position Embeddings},
  booktitle    = {Findings of the Association for Computational Linguistics:
                  {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages        = {4449--4472},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.326},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.326},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SinhaKRPHW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 paper; the record links to OpenReview and carries no doi field.
@inproceedings{DBLP:conf/iclr/CacciaAATPB22,
  author       = {Caccia, Lucas and
                  Aljundi, Rahaf and
                  Asadi, Nader and
                  Tuytelaars, Tinne and
                  Pineau, Joelle and
                  Belilovsky, Eugene},
  title        = {New Insights on Reducing Abrupt Representation Change in
                  Online Continual Learning},
  booktitle    = {The Tenth International Conference on Learning Representations,
                  {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=N8MaByOzUfb},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/CacciaAATPB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2022 paper (PMLR vol. 162). DBLP:journals/corr/abs-2202-07013 is the
% arXiv record with the same title and authors.
@inproceedings{DBLP:conf/icml/XieSFP022,
  author       = {Xie, Annie and
                  Sodhani, Shagun and
                  Finn, Chelsea and
                  Pineau, Joelle and
                  Zhang, Amy},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Robust Policy Learning over Multiple Uncertainty Sets},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022,
                  17-23 July 2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {24414--24429},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/xie22c.html},
  timestamp    = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/XieSFP022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% L4DC 2022 paper (PMLR vol. 168). The acronym in the title is brace-protected
% so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/l4dc/SodhaniMP022,
  author       = {Sodhani, Shagun and
                  Meier, Franziska and
                  Pineau, Joelle and
                  Zhang, Amy},
  editor       = {Firoozi, Roya and
                  Mehr, Negar and
                  Yel, Esen and
                  Antonova, Rika and
                  Bohg, Jeannette and
                  Schwager, Mac and
                  Kochenderfer, Mykel J.},
  title        = {Block Contextual {MDPs} for Continual Learning},
  booktitle    = {Learning for Dynamics and Control Conference, {L4DC} 2022,
                  23-24 June 2022, Stanford University, Stanford, CA, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {168},
  pages        = {608--623},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v168/sodhani22a.html},
  timestamp    = {Fri, 20 May 2022 14:36:40 +0200},
  biburl       = {https://dblp.org/rec/conf/l4dc/SodhaniMP022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2201.01836. DBLP:conf/aaai/GX-ChenCRP22 carries the same
% title and authors as an AAAI 2022 paper.
@article{DBLP:journals/corr/abs-2201-01836,
  author       = {GX{-}Chen, Anthony and
                  Chelu, Veronica and
                  Richards, Blake A. and
                  Pineau, Joelle},
  title        = {A Generalized Bootstrap Target for Value-Learning, Efficiently
                  Combining Value and Feature Predictions},
  journal      = {CoRR},
  volume       = {abs/2201.01836},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.01836},
  eprinttype   = {arXiv},
  eprint       = {2201.01836},
  timestamp    = {Mon, 10 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-01836.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2202.07013. DBLP:conf/icml/XieSFP022 carries the same
% title and authors as an ICML 2022 paper.
@article{DBLP:journals/corr/abs-2202-07013,
  author       = {Xie, Annie and
                  Sodhani, Shagun and
                  Finn, Chelsea and
                  Pineau, Joelle and
                  Zhang, Amy},
  title        = {Robust Policy Learning over Multiple Uncertainty Sets},
  journal      = {CoRR},
  volume       = {abs/2202.07013},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.07013},
  eprinttype   = {arXiv},
  eprint       = {2202.07013},
  timestamp    = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-07013.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2202.09826.
@article{DBLP:journals/corr/abs-2202-09826,
  author       = {Doan, Thang and
                  Mirzadeh, Seyed{-}Iman and
                  Pineau, Joelle and
                  Farajtabar, Mehrdad},
  title        = {Efficient Continual Learning Ensembles in Neural Network Subspaces},
  journal      = {CoRR},
  volume       = {abs/2202.09826},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.09826},
  eprinttype   = {arXiv},
  eprint       = {2202.09826},
  timestamp    = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-09826.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2203.00097. DBLP:journals/eor/CousineauVMP23 carries the
% same title and authors as a journal article.
@article{DBLP:journals/corr/abs-2203-00097,
  author       = {Cousineau, Martin and
                  Verter, Vedat and
                  Murphy, Susan A. and
                  Pineau, Joelle},
  title        = {Estimating causal effects with optimization-based methods:
                  {A} review and empirical comparison},
  journal      = {CoRR},
  volume       = {abs/2203.00097},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.00097},
  doi          = {10.48550/ARXIV.2203.00097},
  eprinttype   = {arXiv},
  eprint       = {2203.00097},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-00097.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2204.07496. DBLP:conf/emnlp/SachanLJAYPZ22 carries the
% same title and authors as an EMNLP 2022 paper.
@article{DBLP:journals/corr/abs-2204-07496,
  author       = {Sachan, Devendra Singh and
                  Lewis, Mike and
                  Joshi, Mandar and
                  Aghajanyan, Armen and
                  Yih, Wen{-}tau and
                  Pineau, Joelle and
                  Zettlemoyer, Luke},
  title        = {Improving Passage Retrieval with Zero-Shot Question Generation},
  journal      = {CoRR},
  volume       = {abs/2204.07496},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.07496},
  doi          = {10.48550/ARXIV.2204.07496},
  eprinttype   = {arXiv},
  eprint       = {2204.07496},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-07496.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2206.10658. DBLP:journals/tacl/SachanLYZPZ23 carries the
% same title and authors as a TACL article.
@article{DBLP:journals/corr/abs-2206-10658,
  author       = {Sachan, Devendra Singh and
                  Lewis, Mike and
                  Yogatama, Dani and
                  Zettlemoyer, Luke and
                  Pineau, Joelle and
                  Zaheer, Manzil},
  title        = {Questions Are All You Need to Train a Dense Passage Retriever},
  journal      = {CoRR},
  volume       = {abs/2206.10658},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.10658},
  doi          = {10.48550/ARXIV.2206.10658},
  eprinttype   = {arXiv},
  eprint       = {2206.10658},
  timestamp    = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-10658.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 2210.12574. DBLP:conf/emnlp/SinhaKRPHW22 carries the same
% title and authors as a Findings of EMNLP 2022 paper.
@article{DBLP:journals/corr/abs-2210-12574,
  author       = {Sinha, Koustuv and
                  Kazemnejad, Amirhossein and
                  Reddy, Siva and
                  Pineau, Joelle and
                  Hupkes, Dieuwke and
                  Williams, Adina},
  title        = {The Curious Case of Absolute Position Embeddings},
  journal      = {CoRR},
  volume       = {abs/2210.12574},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.12574},
  doi          = {10.48550/ARXIV.2210.12574},
  eprinttype   = {arXiv},
  eprint       = {2210.12574},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-12574.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% JMLR article (vol. 22, 2021). The title has a space before the parenthetical
% and a brace-protected acronym so sentence-casing styles keep its capitals.
@article{DBLP:journals/jmlr/PineauVSLBdFL21,
  author       = {Pineau, Joelle and
                  Vincent{-}Lamarre, Philippe and
                  Sinha, Koustuv and
                  Larivi{\`{e}}re, Vincent and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Larochelle, Hugo},
  title        = {Improving Reproducibility in Machine Learning Research
                  (A Report from the {NeurIPS} 2019 Reproducibility Program)},
  journal      = {J. Mach. Learn. Res.},
  volume       = {22},
  pages        = {164:1--164:20},
  year         = {2021},
  url          = {https://jmlr.org/papers/v22/20-303.html},
  timestamp    = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/PineauVSLBdFL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2021 paper, published by AAAI Press.
@inproceedings{DBLP:conf/aaai/Yarats0KAPF21,
  author       = {Yarats, Denis and
                  Zhang, Amy and
                  Kostrikov, Ilya and
                  Amos, Brandon and
                  Pineau, Joelle and
                  Fergus, Rob},
  title        = {Improving Sample Efficiency in Model-Free Reinforcement
                  Learning from Images},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
                  Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event,
                  February 2-9, 2021},
  pages        = {10674--10681},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i12.17276},
  doi          = {10.1609/AAAI.V35I12.17276},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Yarats0KAPF21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 long paper. The key ends in 20 although the year field is
% 2021; the key is kept unchanged so existing citations still resolve.
% The mixed-case first title word is brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/acl/SinhaPPW20,
  author       = {Sinha, Koustuv and
                  Parthasarathi, Prasanna and
                  Pineau, Joelle and
                  Williams, Adina},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{UnNatural} Language Inference},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for
                  Computational Linguistics and the 11th International Joint
                  Conference on Natural Language Processing, {ACL/IJCNLP} 2021,
                  (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages        = {7329--7346},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.569},
  doi          = {10.18653/V1/2021.ACL-LONG.569},
  timestamp    = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SinhaPPW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS 2021 paper. The method name and the proper noun in the title are
% brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/atal/Romoff0KBTBP21,
  author       = {Romoff, Joshua and
                  Henderson, Peter and
                  Kanaa, David and
                  Bengio, Emmanuel and
                  Touati, Ahmed and
                  Bacon, Pierre{-}Luc and
                  Pineau, Joelle},
  editor       = {Dignum, Frank and
                  Lomuscio, Alessio and
                  Endriss, Ulle and
                  Now{\'{e}}, Ann},
  title        = {{TDprop}: Does Adaptive Optimization With {Jacobi} Preconditioning
                  Help Temporal Difference Learning?},
  booktitle    = {{AAMAS} '21: 20th International Conference on Autonomous Agents
                  and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages        = {1082--1090},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p1082.pdf},
  doi          = {10.5555/3463952.3464078},
  timestamp    = {Wed, 20 Jul 2022 17:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/Romoff0KBTBP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EACL 2021 main-volume paper.
@inproceedings{DBLP:conf/eacl/JamborTPH21,
  author       = {Jambor, Dora and
                  Teru, Komal K. and
                  Pineau, Joelle and
                  Hamilton, William L.},
  editor       = {Merlo, Paola and
                  Tiedemann, J{\"{o}}rg and
                  Tsarfaty, Reut},
  title        = {Exploring the Limits of Few-Shot Link Prediction in Knowledge Graphs},
  booktitle    = {Proceedings of the 16th Conference of the European Chapter
                  of the Association for Computational Linguistics: Main Volume,
                  {EACL} 2021, Online, April 19 - 23, 2021},
  pages        = {2816--2822},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.eacl-main.245},
  doi          = {10.18653/V1/2021.EACL-MAIN.245},
  timestamp    = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eacl/JamborTPH21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2021 main-conference paper. NOTE(review): the shuffled word order in the
% title subtitle looks deliberate; it is reproduced exactly as recorded.
@inproceedings{DBLP:conf/emnlp/SinhaJHPWK21,
  author       = {Sinha, Koustuv and
                  Jia, Robin and
                  Hupkes, Dieuwke and
                  Pineau, Joelle and
                  Williams, Adina and
                  Kiela, Douwe},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Masked Language Modeling and the Distributional Hypothesis:
                  Order Word Matters Pre-training for Little},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in
                  Natural Language Processing, {EMNLP} 2021, Virtual Event /
                  Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages        = {2888--2913},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.230},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.230},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/SinhaJHPWK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of EMNLP 2021 paper.
@inproceedings{DBLP:conf/emnlp/ParthasarathiSP21,
  author       = {Parthasarathi, Prasanna and
                  Sinha, Koustuv and
                  Pineau, Joelle and
                  Williams, Adina},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Sometimes We Want Ungrammatical Translations},
  booktitle    = {Findings of the Association for Computational Linguistics:
                  {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic,
                  16-20 November, 2021},
  pages        = {3205--3227},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.findings-emnlp.275},
  doi          = {10.18653/V1/2021.FINDINGS-EMNLP.275},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ParthasarathiSP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper; links to OpenReview, no doi field. The acronym in the title
% is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/iclr/0001SKP21,
  author       = {Zhang, Amy and
                  Sodhani, Shagun and
                  Khetarpal, Khimya and
                  Pineau, Joelle},
  title        = {Learning Robust State Abstractions for Hidden-Parameter Block {MDPs}},
  booktitle    = {9th International Conference on Learning Representations,
                  {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=fmOOI2a3tQP},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/0001SKP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper; the record links to OpenReview and carries no doi field.
@inproceedings{DBLP:conf/iclr/JeonSBDNP21,
  author       = {Jeon, Wonseok and
                  Su, Chen{-}Yang and
                  Barde, Paul and
                  Doan, Thang and
                  Nowrouzezahrai, Derek and
                  Pineau, Joelle},
  title        = {Regularized Inverse Reinforcement Learning},
  booktitle    = {9th International Conference on Learning Representations,
                  {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=HgLO8yalfwc},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/JeonSBDNP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (PMLR vol. 139). The method name in the title is
% brace-protected; the url uses https like the file's other PMLR links.
@inproceedings{DBLP:conf/icml/0004JLPK21,
  author       = {Lee, Jongmin and
                  Jeon, Wonseok and
                  Lee, Byung{-}Jun and
                  Pineau, Joelle and
                  Kim, Kee{-}Eung},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {{OptiDICE}: Offline Policy Optimization via Stationary
                  Distribution Correction Estimation},
  booktitle    = {Proceedings of the 38th International Conference on Machine
                  Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {6120--6130},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/lee21f.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/0004JLPK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/Sodhani0P21,
  author    = {Shagun Sodhani and
               Amy Zhang and
               Joelle Pineau},
  editor    = {Marina Meila and
               Tong Zhang},
  title     = {Multi-Task Reinforcement Learning with Context-based Representations},
  year      = {2021},
  booktitle = {Proceedings of the 38th International Conference on Machine Learning,
               {ICML} 2021, 18-24 July 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {139},
  pages     = {9767--9779},
  publisher = {{PMLR}},
  url       = {http://proceedings.mlr.press/v139/sodhani21a.html},
  timestamp = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Sodhani0P21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
% "Seldonian" and "MDPs" are brace-protected so sentence-casing styles keep
% their capitals; the venue acronym in booktitle is braced like the other
% venue acronyms in this file.
@inproceedings{DBLP:conf/nips/SatijaTPL21,
  author       = {Harsh Satija and
                  Philip S. Thomas and
                  Joelle Pineau and
                  Romain Laroche},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Multi-Objective {SPIBB:} {Seldonian} Offline Policy Improvement with
                  Safety Constraints in Finite {MDPs}},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {2004--2017},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/0f65caf0a7d00afd2b87c028e88fe931-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SatijaTPL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SIGdial 2021 paper.
% The venue acronym in booktitle is brace-protected, matching how the other
% venue acronyms in this file are written, so its mixed case survives any
% style that recases booktitle.
@inproceedings{DBLP:conf/sigdial/ParthasarathiAC21,
  author       = {Prasanna Parthasarathi and
                  Mohamed A. Abdelsalam and
                  Sarath Chandar and
                  Joelle Pineau},
  editor       = {Haizhou Li and
                  Gina{-}Anne Levow and
                  Zhou Yu and
                  Chitralekha Gupta and
                  Berrak Sisman and
                  Siqi Cai and
                  David Vandyke and
                  Nina Dethlefs and
                  Yan Wu and
                  Junyi Jessy Li},
  title        = {A Brief Study on the Effects of Training Generative Dialogue Models
                  with a Semantic loss},
  booktitle    = {Proceedings of the 22nd Annual Meeting of the Special Interest Group
                  on Discourse and Dialogue, {SIGdial} 2021, Singapore and Online, July
                  29-31, 2021},
  pages        = {469--476},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.sigdial-1.49},
  doi          = {10.18653/V1/2021.SIGDIAL-1.49},
  timestamp    = {Thu, 15 Aug 2024 07:54:16 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/ParthasarathiAC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SIGdial 2021 paper.
% The venue acronym in booktitle is brace-protected, matching how the other
% venue acronyms in this file are written, so its mixed case survives any
% style that recases booktitle.
@inproceedings{DBLP:conf/sigdial/ParthasarathiPC21,
  author       = {Prasanna Parthasarathi and
                  Joelle Pineau and
                  Sarath Chandar},
  editor       = {Haizhou Li and
                  Gina{-}Anne Levow and
                  Zhou Yu and
                  Chitralekha Gupta and
                  Berrak Sisman and
                  Siqi Cai and
                  David Vandyke and
                  Nina Dethlefs and
                  Yan Wu and
                  Junyi Jessy Li},
  title        = {Do Encoder Representations of Generative Dialogue Models have sufficient
                  summary of the Information about the task ?},
  booktitle    = {Proceedings of the 22nd Annual Meeting of the Special Interest Group
                  on Discourse and Dialogue, {SIGdial} 2021, Singapore and Online, July
                  29-31, 2021},
  pages        = {477--488},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.sigdial-1.50},
  doi          = {10.18653/V1/2021.SIGDIAL-1.50},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/ParthasarathiPC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CSSL 2021 workshop paper (LNCS volume 13418).
% The mixed-case method name is brace-protected so sentence-casing styles do
% not flatten it to "Special"; the colon stays outside the braces so the word
% after it keeps its capital.
@inproceedings{DBLP:conf/wcssl/CacciaP21,
  author       = {Lucas Caccia and
                  Joelle Pineau},
  editor       = {Fabio Cuzzolin and
                  Kevin Cannons and
                  Vincenzo Lomonaco},
  title        = {{SPeCiaL}: Self-supervised Pretraining for Continual Learning},
  booktitle    = {Continual Semi-Supervised Learning - First International Workshop,
                  {CSSL} 2021, Virtual Event, August 19-20, 2021, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {13418},
  pages        = {91--103},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-031-17587-9\_7},
  doi          = {10.1007/978-3-031-17587-9\_7},
  timestamp    = {Fri, 07 Oct 2022 15:35:11 +0200},
  biburl       = {https://dblp.org/rec/conf/wcssl/CacciaP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Chapter in an edited collection (LNCS volume 12600).
@incollection{DBLP:series/lncs/DelacroixPM21,
  author    = {Sylvie Delacroix and
               Joelle Pineau and
               Jessica Montgomery},
  editor    = {Bertrand Braunschweig and
               Malik Ghallab},
  title     = {Democratising the Digital Revolution: The Role of Data Governance},
  year      = {2021},
  booktitle = {Reflections on Artificial Intelligence for Humanity},
  series    = {Lecture Notes in Computer Science},
  volume    = {12600},
  pages     = {40--52},
  publisher = {Springer},
  doi       = {10.1007/978-3-030-69128-8\_3},
  url       = {https://doi.org/10.1007/978-3-030-69128-8\_3},
  timestamp = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/series/lncs/DelacroixPM21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.00010, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2101-00010,
  author     = {Koustuv Sinha and
                Prasanna Parthasarathi and
                Joelle Pineau and
                Adina Williams},
  title      = {Unnatural Language Inference},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2101.00010},
  url        = {https://arxiv.org/abs/2101.00010},
  eprinttype = {arXiv},
  eprint     = {2101.00010},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-00010.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.04909, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2101-04909,
  author     = {Anuroop Sriram and
                Matthew J. Muckley and
                Koustuv Sinha and
                Farah Shamout and
                Joelle Pineau and
                Krzysztof J. Geras and
                Lea Azour and
                Yindalon Aphinyanaphongs and
                Nafissa Yakubova and
                William Moore},
  title      = {{COVID-19} Prognosis via Self-Supervised Representation Learning and
                Multi-Image Prediction},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2101.04909},
  url        = {https://arxiv.org/abs/2101.04909},
  eprinttype = {arXiv},
  eprint     = {2101.04909},
  timestamp  = {Sat, 30 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-04909.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.03419, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2102-03419,
  author     = {Dora Jambor and
                Komal K. Teru and
                Joelle Pineau and
                William L. Hamilton},
  title      = {Exploring the Limits of Few-Shot Link Prediction in Knowledge Graphs},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2102.03419},
  url        = {https://arxiv.org/abs/2102.03419},
  eprinttype = {arXiv},
  eprint     = {2102.03419},
  timestamp  = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-03419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.06177. Same title and author list as the ICML 2021
% record DBLP:conf/icml/Sodhani0P21 in this file.
@article{DBLP:journals/corr/abs-2102-06177,
  author     = {Shagun Sodhani and
                Amy Zhang and
                Joelle Pineau},
  title      = {Multi-Task Reinforcement Learning with Context-based Representations},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2102.06177},
  url        = {https://arxiv.org/abs/2102.06177},
  eprinttype = {arXiv},
  eprint     = {2102.06177},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-06177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.07097, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2102-07097,
  author     = {Bonnie Li and
                Vincent Fran{\c{c}}ois{-}Lavet and
                Thang Doan and
                Joelle Pineau},
  title      = {Domain Adversarial Reinforcement Learning},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2102.07097},
  url        = {https://arxiv.org/abs/2102.07097},
  eprinttype = {arXiv},
  eprint     = {2102.07097},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-07097.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.09850, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2102-09850,
  author     = {Manan Tomar and
                Amy Zhang and
                Roberto Calandra and
                Matthew E. Taylor and
                Joelle Pineau},
  title      = {Model-Invariant State Abstractions for Model-Based Reinforcement Learning},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2102.09850},
  url        = {https://arxiv.org/abs/2102.09850},
  eprinttype = {arXiv},
  eprint     = {2102.09850},
  timestamp  = {Wed, 24 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-09850.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2103.08067, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2103-08067,
  author     = {Kalesha Bullard and
                Douwe Kiela and
                Joelle Pineau and
                Jakob N. Foerster},
  title      = {Quasi-Equivalence Discovery for Zero-Shot Emergent Communication},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2103.08067},
  url        = {https://arxiv.org/abs/2103.08067},
  eprinttype = {arXiv},
  eprint     = {2103.08067},
  timestamp  = {Tue, 23 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-08067.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.05025, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2104-05025,
  author     = {Lucas Caccia and
                Rahaf Aljundi and
                Tinne Tuytelaars and
                Joelle Pineau and
                Eugene Belilovsky},
  title      = {Reducing Representation Drift in Online Continual Learning},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2104.05025},
  url        = {https://arxiv.org/abs/2104.05025},
  eprinttype = {arXiv},
  eprint     = {2104.05025},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-05025.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.06644, recorded by DBLP as a CoRR article.
% NOTE(review): the scrambled word order in the title looks deliberate; it is
% reproduced verbatim here. Confirm against the paper before "correcting" it.
@article{DBLP:journals/corr/abs-2104-06644,
  author     = {Koustuv Sinha and
                Robin Jia and
                Dieuwke Hupkes and
                Joelle Pineau and
                Adina Williams and
                Douwe Kiela},
  title      = {Masked Language Modeling and the Distributional Hypothesis: Order
                Word Matters Pre-training for Little},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2104.06644},
  url        = {https://arxiv.org/abs/2104.06644},
  eprinttype = {arXiv},
  eprint     = {2104.06644},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-06644.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.07623, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2104-07623,
  author     = {Prasanna Parthasarathi and
                Koustuv Sinha and
                Joelle Pineau and
                Adina Williams},
  title      = {Sometimes We Want Translationese},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2104.07623},
  url        = {https://arxiv.org/abs/2104.07623},
  eprinttype = {arXiv},
  eprint     = {2104.07623},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-07623.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.00099. Same title and author list as the NeurIPS 2021
% record DBLP:conf/nips/SatijaTPL21 in this file.
% "Seldonian" and "MDPs" are brace-protected so sentence-casing styles keep
% their capitals.
@article{DBLP:journals/corr/abs-2106-00099,
  author       = {Harsh Satija and
                  Philip S. Thomas and
                  Joelle Pineau and
                  Romain Laroche},
  title        = {Multi-Objective {SPIBB:} {Seldonian} Offline Policy Improvement with
                  Safety Constraints in Finite {MDPs}},
  journal      = {CoRR},
  volume       = {abs/2106.00099},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.00099},
  eprinttype   = {arXiv},
  eprint       = {2106.00099},
  timestamp    = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-00099.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.03955, recorded by DBLP as a CoRR article.
@article{DBLP:journals/corr/abs-2106-03955,
  author     = {Emmanuel Bengio and
                Joelle Pineau and
                Doina Precup},
  title      = {Correcting Momentum in Temporal Difference Learning},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2106.03955},
  url        = {https://arxiv.org/abs/2106.03955},
  eprinttype = {arXiv},
  eprint     = {2106.03955},
  timestamp  = {Thu, 10 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-03955.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.09065. Same authors as the workshop record
% DBLP:conf/wcssl/CacciaP21 in this file (titles differ only in capitalisation).
% The mixed-case method name is brace-protected so sentence-casing styles do
% not flatten it to "Special"; the colon stays outside the braces so the word
% after it keeps its capital.
@article{DBLP:journals/corr/abs-2106-09065,
  author       = {Lucas Caccia and
                  Joelle Pineau},
  title        = {{SPeCiaL}: Self-Supervised Pretraining for Continual Learning},
  journal      = {CoRR},
  volume       = {abs/2106.09065},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.09065},
  eprinttype   = {arXiv},
  eprint       = {2106.09065},
  timestamp    = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-09065.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.10619. Same title as the SIGdial 2021 record
% DBLP:conf/sigdial/ParthasarathiAC21 in this file; the two records list the
% last two authors in opposite order.
@article{DBLP:journals/corr/abs-2106-10619,
  author     = {Prasanna Parthasarathi and
                Mohamed A. Abdelsalam and
                Joelle Pineau and
                Sarath Chandar},
  title      = {A Brief Study on the Effects of Training Generative Dialogue Models
                with a Semantic loss},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2106.10619},
  url        = {https://arxiv.org/abs/2106.10619},
  eprinttype = {arXiv},
  eprint     = {2106.10619},
  timestamp  = {Tue, 09 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-10619.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.10622.
% NOTE(review): presumably the preprint of DBLP:conf/sigdial/ParthasarathiPC21
% (same authors, differently worded title) - confirm before merging citations.
@article{DBLP:journals/corr/abs-2106-10622,
  author     = {Prasanna Parthasarathi and
                Joelle Pineau and
                Sarath Chandar},
  title      = {Do Encoder Representations of Generative Dialogue Models Encode Sufficient
                Information about the Task ?},
  year       = {2021},
  journal    = {CoRR},
  volume     = {abs/2106.10622},
  url        = {https://arxiv.org/abs/2106.10622},
  eprinttype = {arXiv},
  eprint     = {2106.10622},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-10622.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.10783. Same title and author list as the ICML 2021
% record DBLP:conf/icml/0004JLPK21 in this file.
% The method name is brace-protected so sentence-casing styles do not render it
% as "Optidice"; the colon stays outside the braces so the word after it keeps
% its capital.
@article{DBLP:journals/corr/abs-2106-10783,
  author       = {Jongmin Lee and
                  Wonseok Jeon and
                  Byung{-}Jun Lee and
                  Joelle Pineau and
                  Kee{-}Eung Kim},
  title        = {{OptiDICE}: Offline Policy Optimization via Stationary Distribution
                  Correction Estimation},
  journal      = {CoRR},
  volume       = {abs/2106.10783},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.10783},
  eprinttype   = {arXiv},
  eprint       = {2106.10783},
  timestamp    = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-10783.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.06972, recorded by DBLP as a CoRR article.
% The acronym "MDPs" is brace-protected so sentence-casing styles do not
% lowercase it.
@article{DBLP:journals/corr/abs-2110-06972,
  author       = {Shagun Sodhani and
                  Franziska Meier and
                  Joelle Pineau and
                  Amy Zhang},
  title        = {Block Contextual {MDPs} for Continual Learning},
  journal      = {CoRR},
  volume       = {abs/2110.06972},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.06972},
  eprinttype   = {arXiv},
  eprint       = {2110.06972},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-06972.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Artif. Intell. Res. volume 69 (2020).
@article{DBLP:journals/jair/SerbanSPPB20,
  author    = {Iulian Vlad Serban and
               Chinnadhurai Sankar and
               Michael Pieper and
               Joelle Pineau and
               Yoshua Bengio},
  title     = {The Bottleneck Simulator: {A} Model-Based Deep Reinforcement Learning
               Approach},
  year      = {2020},
  journal   = {J. Artif. Intell. Res.},
  volume    = {69},
  pages     = {571--612},
  doi       = {10.1613/JAIR.1.12463},
  url       = {https://doi.org/10.1613/jair.1.12463},
  timestamp = {Fri, 06 Nov 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/SerbanSPPB20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Nat. Mach. Intell. volume 2, number 6 (2020).
@article{DBLP:journals/natmi/Peiffer-SmadjaM20,
  author    = {Nathan Peiffer{-}Smadja and
               Redwan Maatoug and
               Fran{\c{c}}ois{-}Xavier Lescure and
               Eric D'ortenzio and
               Joelle Pineau and
               Jean{-}R{\'{e}}mi King},
  title     = {Machine Learning for {COVID-19} needs global collaboration and data-sharing},
  year      = {2020},
  journal   = {Nat. Mach. Intell.},
  volume    = {2},
  number    = {6},
  pages     = {293--294},
  doi       = {10.1038/S42256-020-0181-6},
  url       = {https://doi.org/10.1038/s42256-020-0181-6},
  timestamp = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/natmi/Peiffer-SmadjaM20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2020 conference paper.
@inproceedings{DBLP:conf/aaai/CrawfordP20,
  author    = {Eric Crawford and
               Joelle Pineau},
  title     = {Exploiting Spatial Invariance for Scalable Unsupervised Object Tracking},
  year      = {2020},
  booktitle = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
               2020, The Thirty-Second Innovative Applications of Artificial Intelligence
               Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
               Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
               February 7-12, 2020},
  pages     = {3684--3692},
  publisher = {{AAAI} Press},
  doi       = {10.1609/AAAI.V34I04.5777},
  url       = {https://doi.org/10.1609/aaai.v34i04.5777},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/CrawfordP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2020 student abstract (two pages).
@inproceedings{DBLP:conf/aaai/ZhangDP20,
  author    = {Qizhen Zhang and
               Audrey Durand and
               Joelle Pineau},
  title     = {Literature Mining for Incorporating Inductive Bias in Biomedical Prediction
               Tasks (Student Abstract)},
  year      = {2020},
  booktitle = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
               2020, The Thirty-Second Innovative Applications of Artificial Intelligence
               Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
               Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
               February 7-12, 2020},
  pages     = {13983--13984},
  publisher = {{AAAI} Press},
  doi       = {10.1609/AAAI.V34I10.7264},
  url       = {https://doi.org/10.1609/aaai.v34i10.7264},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/ZhangDP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2020 conference paper.
@inproceedings{DBLP:conf/acl/SinhaPWLHP20,
  author    = {Koustuv Sinha and
               Prasanna Parthasarathi and
               Jasmine Wang and
               Ryan Lowe and
               William L. Hamilton and
               Joelle Pineau},
  editor    = {Dan Jurafsky and
               Joyce Chai and
               Natalie Schluter and
               Joel R. Tetreault},
  title     = {Learning an Unreferenced Metric for Online Dialogue Evaluation},
  year      = {2020},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational
               Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages     = {2430--2441},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/V1/2020.ACL-MAIN.220},
  url       = {https://doi.org/10.18653/v1/2020.acl-main.220},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/SinhaPWLHP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AIED 2020 conference paper (LNCS volume 12164, proceedings part II).
@inproceedings{DBLP:conf/aied/KochmarVBGSP20,
  author    = {Ekaterina Kochmar and
               Dung Do Vu and
               Robert Belfer and
               Varun Gupta and
               Iulian Vlad Serban and
               Joelle Pineau},
  editor    = {Ig Ibert Bittencourt and
               Mutlu Cukurova and
               Kasia Muldner and
               Rose Luckin and
               Eva Mill{\'{a}}n},
  title     = {Automated Personalized Feedback Improves Learning Gains in An Intelligent
               Tutoring System},
  year      = {2020},
  booktitle = {Artificial Intelligence in Education - 21st International Conference,
               {AIED} 2020, Ifrane, Morocco, July 6-10, 2020, Proceedings, Part {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {12164},
  pages     = {140--146},
  publisher = {Springer},
  doi       = {10.1007/978-3-030-52240-7\_26},
  url       = {https://doi.org/10.1007/978-3-030-52240-7\_26},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aied/KochmarVBGSP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AIED 2020 conference paper (LNCS volume 12164, proceedings part II).
@inproceedings{DBLP:conf/aied/SerbanGKVBPCCB20,
  author    = {Iulian Vlad Serban and
               Varun Gupta and
               Ekaterina Kochmar and
               Dung Do Vu and
               Robert Belfer and
               Joelle Pineau and
               Aaron C. Courville and
               Laurent Charlin and
               Yoshua Bengio},
  editor    = {Ig Ibert Bittencourt and
               Mutlu Cukurova and
               Kasia Muldner and
               Rose Luckin and
               Eva Mill{\'{a}}n},
  title     = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for
               {STEM}},
  year      = {2020},
  booktitle = {Artificial Intelligence in Education - 21st International Conference,
               {AIED} 2020, Ifrane, Morocco, July 6-10, 2020, Proceedings, Part {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {12164},
  pages     = {387--392},
  publisher = {Springer},
  doi       = {10.1007/978-3-030-52240-7\_70},
  url       = {https://doi.org/10.1007/978-3-030-52240-7\_70},
  timestamp = {Tue, 07 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aied/SerbanGKVBPCCB20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% DEBS 2020 single-author, single-page entry.
@inproceedings{DBLP:conf/debs/Pineau20,
  author    = {Joelle Pineau},
  editor    = {Julien Gascon{-}Samson and
               Kaiwen Zhang and
               Khuzaima Daudjee and
               Bettina Kemme},
  title     = {Building reproducible, reusable, and robust machine learning software},
  year      = {2020},
  booktitle = {14th {ACM} International Conference on Distributed and Event-based
               Systems, {DEBS} 2020, Montreal, Quebec, Canada, July 13-17, 2020},
  pages     = {2},
  publisher = {{ACM}},
  doi       = {10.1145/3401025.3407941},
  url       = {https://doi.org/10.1145/3401025.3407941},
  timestamp = {Wed, 20 Jul 2022 14:24:56 +0200},
  biburl    = {https://dblp.org/rec/conf/debs/Pineau20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; the url field points at the OpenReview forum page.
% The acronym "GANs" is brace-protected so sentence-casing styles do not
% lowercase it.
@inproceedings{DBLP:conf/iclr/CacciaCFLPC20,
  author       = {Massimo Caccia and
                  Lucas Caccia and
                  William Fedus and
                  Hugo Larochelle and
                  Joelle Pineau and
                  Laurent Charlin},
  title        = {Language {GANs} Falling Short},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=BJgza6VtPB},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/CacciaCFLPC20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; the url field points at the OpenReview forum page.
@inproceedings{DBLP:conf/iclr/Lowe0FKP20,
  author    = {Ryan Lowe and
               Abhinav Gupta and
               Jakob N. Foerster and
               Douwe Kiela and
               Joelle Pineau},
  title     = {On the interaction between supervision and self-play in emergent communication},
  year      = {2020},
  booktitle = {8th International Conference on Learning Representations, {ICLR} 2020,
               Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher = {OpenReview.net},
  url       = {https://openreview.net/forum?id=rJxGLlBtwH},
  timestamp = {Thu, 07 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/Lowe0FKP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper (PMLR volume 119).
@inproceedings{DBLP:conf/icml/BengioPP20,
  author    = {Emmanuel Bengio and
               Joelle Pineau and
               Doina Precup},
  title     = {Interference and Generalization in Temporal Difference Learning},
  year      = {2020},
  booktitle = {Proceedings of the 37th International Conference on Machine Learning,
               {ICML} 2020, 13-18 July 2020, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {119},
  pages     = {767--777},
  publisher = {{PMLR}},
  url       = {http://proceedings.mlr.press/v119/bengio20a.html},
  timestamp = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/BengioPP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper (PMLR volume 119).
@inproceedings{DBLP:conf/icml/CacciaBCP20,
  author    = {Lucas Caccia and
               Eugene Belilovsky and
               Massimo Caccia and
               Joelle Pineau},
  title     = {Online Learned Continual Compression with Adaptive Quantization Modules},
  year      = {2020},
  booktitle = {Proceedings of the 37th International Conference on Machine Learning,
               {ICML} 2020, 13-18 July 2020, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {119},
  pages     = {1240--1250},
  publisher = {{PMLR}},
  url       = {http://proceedings.mlr.press/v119/caccia20a.html},
  timestamp = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/CacciaBCP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper (PMLR volume 119).
% The proper noun "Markov" is brace-protected so sentence-casing styles do not
% lowercase it.
@inproceedings{DBLP:conf/icml/SatijaAP20,
  author       = {Harsh Satija and
                  Philip Amortila and
                  Joelle Pineau},
  title        = {Constrained {Markov} Decision Processes via Backward Value Functions},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {8502--8511},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/satija20a.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/SatijaAP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper (PMLR volume 119).
% The acronym "MDPs" is brace-protected so sentence-casing styles do not
% lowercase it.
@inproceedings{DBLP:conf/icml/0001LSFKPGP20,
  author       = {Amy Zhang and
                  Clare Lyle and
                  Shagun Sodhani and
                  Angelos Filos and
                  Marta Kwiatkowska and
                  Joelle Pineau and
                  Yarin Gal and
                  Doina Precup},
  title        = {Invariant Causal Prediction for Block {MDPs}},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {11214--11224},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/zhang20t.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/0001LSFKPGP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2020 conference paper.
@inproceedings{DBLP:conf/ijcai/WabarthaDFP20,
  author    = {Maxime Wabartha and
               Audrey Durand and
               Vincent Fran{\c{c}}ois{-}Lavet and
               Joelle Pineau},
  editor    = {Christian Bessiere},
  title     = {Handling Black Swan Events in Deep Learning with Diversely Extrapolated
               Neural Networks},
  year      = {2020},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on
               Artificial Intelligence, {IJCAI} 2020},
  pages     = {2140--2147},
  publisher = {ijcai.org},
  doi       = {10.24963/IJCAI.2020/296},
  url       = {https://doi.org/10.24963/ijcai.2020/296},
  timestamp = {Mon, 20 Jul 2020 12:38:52 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/WabarthaDFP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/Francois-LavetR20,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Rabusseau, Guillaume and
                  Pineau, Joelle and
                  Ernst, Damien and
                  Fonteneau, Raphael},
  editor       = {Bessiere, Christian},
  title        = {On Overfitting and Asymptotic Bias in Batch Reinforcement Learning
                  with Partial Observability (Extended Abstract)},
  booktitle    = {Proceedings of the Twenty-Ninth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2020},
  pages        = {5055--5059},
  publisher    = {ijcai.org},
  year         = {2020},
  url          = {https://doi.org/10.24963/ijcai.2020/706},
  doi          = {10.24963/IJCAI.2020/706},
  timestamp    = {Wed, 15 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/Francois-LavetR20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/l4dc/Yang0MPAC20,
  author       = {Ge Yang and
                  Amy Zhang and
                  Ari S. Morcos and
                  Joelle Pineau and
                  Pieter Abbeel and
                  Roberto Calandra},
  editor       = {Alexandre M. Bayen and
                  Ali Jadbabaie and
                  George J. Pappas and
                  Pablo A. Parrilo and
                  Benjamin Recht and
                  Claire J. Tomlin and
                  Melanie N. Zeilinger},
  title        = {{Plan2Vec}: Unsupervised Representation Learning by Latent Plans},
  booktitle    = {Proceedings of the 2nd Annual Conference on Learning for Dynamics
                  and Control, {L4DC} 2020, Online Event, Berkeley, CA, USA, 11-12 June
                  2020},
  series       = {Proceedings of Machine Learning Research},
  volume       = {120},
  pages        = {935--946},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v120/yang20b.html},
  timestamp    = {Fri, 07 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/l4dc/Yang0MPAC20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BardeRJPPN20,
  author       = {Barde, Paul and
                  Roy, Julien and
                  Jeon, Wonseok and
                  Pineau, Joelle and
                  Pal, Chris and
                  Nowrouzezahrai, Derek},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy
                  Optimization},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/9161ab7a1b61012c4c303f10b4c16b2c-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BardeRJPPN20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/TaoFP20,
  author       = {Tao, Ruo Yu and
                  Fran{\c{c}}ois{-}Lavet, Vincent and
                  Pineau, Joelle},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Novelty Search in Representational Space for Sample Efficient Exploration},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/5ca41a86596a5ed567d15af0be224952-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/TaoFP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/Touati0PV20,
  author       = {Touati, Ahmed and
                  Zhang, Amy and
                  Pineau, Joelle and
                  Vincent, Pascal},
  editor       = {Adams, Ryan P. and
                  Gogate, Vibhav},
  title        = {Stable Policy Optimization via Off-Policy Divergence Regularization},
  booktitle    = {Proceedings of the Thirty-Sixth Conference on Uncertainty in Artificial
                  Intelligence, {UAI} 2020, virtual online, August 3-6, 2020},
  series       = {Proceedings of Machine Learning Research},
  volume       = {124},
  pages        = {1328--1337},
  publisher    = {{AUAI} Press},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v124/touati20a.html},
  timestamp    = {Tue, 07 May 2024 20:09:01 +0200},
  biburl       = {https://dblp.org/rec/conf/uai/Touati0PV20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-01093,
  author       = {Lowe, Ryan and
                  Gupta, Abhinav and
                  Foerster, Jakob N. and
                  Kiela, Douwe and
                  Pineau, Joelle},
  title        = {On the interaction between supervision and self-play in emergent communication},
  journal      = {CoRR},
  volume       = {abs/2002.01093},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.01093},
  eprinttype   = {arXiv},
  eprint       = {2002.01093},
  timestamp    = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-01093.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02863,
  author       = {Mazoure, Bogdan and
                  Doan, Thang and
                  Li, Tianyu and
                  Makarenkov, Vladimir and
                  Pineau, Joelle and
                  Precup, Doina and
                  Rabusseau, Guillaume},
  title        = {Provably efficient reconstruction of policy networks},
  journal      = {CoRR},
  volume       = {abs/2002.02863},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02863},
  eprinttype   = {arXiv},
  eprint       = {2002.02863},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02863.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-05651,
  author       = {Henderson, Peter and
                  Hu, Jieru and
                  Romoff, Joshua and
                  Brunskill, Emma and
                  Jurafsky, Dan and
                  Pineau, Joelle},
  title        = {Towards the Systematic Reporting of the Energy and Carbon Footprints
                  of Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2002.05651},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.05651},
  eprinttype   = {arXiv},
  eprint       = {2002.05651},
  timestamp    = {Fri, 14 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-05651.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-10525,
  author       = {Jeon, Wonseok and
                  Barde, Paul and
                  Nowrouzezahrai, Derek and
                  Pineau, Joelle},
  title        = {Scalable Multi-Agent Inverse Reinforcement Learning via Actor-Attention-Critic},
  journal      = {CoRR},
  volume       = {abs/2002.10525},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.10525},
  eprinttype   = {arXiv},
  eprint       = {2002.10525},
  timestamp    = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-10525.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-04108,
  author       = {Touati, Ahmed and
                  Zhang, Amy and
                  Pineau, Joelle and
                  Vincent, Pascal},
  title        = {Stable Policy Optimization via Off-Policy Divergence Regularization},
  journal      = {CoRR},
  volume       = {abs/2003.04108},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.04108},
  eprinttype   = {arXiv},
  eprint       = {2003.04108},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-04108.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06016,
  author       = {Amy Zhang and
                  Clare Lyle and
                  Shagun Sodhani and
                  Angelos Filos and
                  Marta Kwiatkowska and
                  Joelle Pineau and
                  Yarin Gal and
                  Doina Precup},
  title        = {Invariant Causal Prediction for Block {MDPs}},
  journal      = {CoRR},
  volume       = {abs/2003.06016},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.06016},
  eprinttype   = {arXiv},
  eprint       = {2003.06016},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-06016.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06350,
  author       = {Bengio, Emmanuel and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Interference and Generalization in Temporal Difference Learning},
  journal      = {CoRR},
  volume       = {abs/2003.06350},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.06350},
  eprinttype   = {arXiv},
  eprint       = {2003.06350},
  timestamp    = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-06350.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06560,
  author       = {Sinha, Koustuv and
                  Sodhani, Shagun and
                  Pineau, Joelle and
                  Hamilton, William L.},
  title        = {Evaluating Logical Generalization in Graph Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2003.06560},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.06560},
  eprinttype   = {arXiv},
  eprint       = {2003.06560},
  timestamp    = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-06560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-12206,
  author       = {Joelle Pineau and
                  Philippe Vincent{-}Lamarre and
                  Koustuv Sinha and
                  Vincent Larivi{\`{e}}re and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Hugo Larochelle},
  title        = {Improving Reproducibility in Machine Learning Research {(A} Report
                  from the {NeurIPS} 2019 Reproducibility Program)},
  journal      = {CoRR},
  volume       = {abs/2003.12206},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.12206},
  eprinttype   = {arXiv},
  eprint       = {2003.12206},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-12206.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-00583,
  author       = {Sinha, Koustuv and
                  Parthasarathi, Prasanna and
                  Wang, Jasmine and
                  Lowe, Ryan and
                  Hamilton, William L. and
                  Pineau, Joelle},
  title        = {Learning an Unreferenced Metric for Online Dialogue Evaluation},
  journal      = {CoRR},
  volume       = {abs/2005.00583},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.00583},
  eprinttype   = {arXiv},
  eprint       = {2005.00583},
  timestamp    = {Fri, 08 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-00583.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-02431,
  author       = {Kochmar, Ekaterina and
                  Vu, Dung Do and
                  Belfer, Robert and
                  Gupta, Varun and
                  Serban, Iulian Vlad and
                  Pineau, Joelle},
  title        = {Automated Personalized Feedback Improves Learning Gains in an Intelligent
                  Tutoring System},
  journal      = {CoRR},
  volume       = {abs/2005.02431},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.02431},
  eprinttype   = {arXiv},
  eprint       = {2005.02431},
  timestamp    = {Sat, 09 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-02431.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-03648,
  author       = {Ge Yang and
                  Amy Zhang and
                  Ari S. Morcos and
                  Joelle Pineau and
                  Pieter Abbeel and
                  Roberto Calandra},
  title        = {{Plan2Vec}: Unsupervised Representation Learning by Latent Plans},
  journal      = {CoRR},
  volume       = {abs/2005.03648},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.03648},
  eprinttype   = {arXiv},
  eprint       = {2005.03648},
  timestamp    = {Fri, 07 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-03648.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-06616,
  author       = {Serban, Iulian Vlad and
                  Gupta, Varun and
                  Kochmar, Ekaterina and
                  Vu, Dung Do and
                  Belfer, Robert and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Charlin, Laurent and
                  Bengio, Yoshua},
  title        = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for
                  {STEM}},
  journal      = {CoRR},
  volume       = {abs/2005.06616},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.06616},
  eprinttype   = {arXiv},
  eprint       = {2005.06616},
  timestamp    = {Fri, 22 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-06616.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-13258,
  author       = {Barde, Paul and
                  Roy, Julien and
                  Jeon, Wonseok and
                  Pineau, Joelle and
                  Pal, Christopher J. and
                  Nowrouzezahrai, Derek},
  title        = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy
                  Optimization},
  journal      = {CoRR},
  volume       = {abs/2006.13258},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.13258},
  eprinttype   = {arXiv},
  eprint       = {2006.13258},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-13258.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-01516,
  author       = {Sharma, Deepak and
                  Durand, Audrey and
                  Legault, Marc{-}Andr{\'{e}} and
                  Lemieux Perreault, Louis{-}Philippe and
                  Lema{\c{c}}on, Audrey and
                  Dub{\'{e}}, Marie{-}Pierre and
                  Pineau, Joelle},
  title        = {Deep interpretability for {GWAS}},
  journal      = {CoRR},
  volume       = {abs/2007.01516},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.01516},
  eprinttype   = {arXiv},
  eprint       = {2007.01516},
  timestamp    = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-01516.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-02786,
  author       = {Joshua Romoff and
                  Peter Henderson and
                  David Kanaa and
                  Emmanuel Bengio and
                  Ahmed Touati and
                  Pierre{-}Luc Bacon and
                  Joelle Pineau},
  title        = {{TDprop}: Does {Jacobi} Preconditioning Help Temporal Difference Learning?},
  journal      = {CoRR},
  volume       = {abs/2007.02786},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.02786},
  eprinttype   = {arXiv},
  eprint       = {2007.02786},
  timestamp    = {Sat, 18 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-02786.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-07206,
  author       = {Zhang, Amy and
                  Sodhani, Shagun and
                  Khetarpal, Khimya and
                  Pineau, Joelle},
  title        = {Multi-Task Reinforcement Learning as a Hidden-Parameter Block {MDP}},
  journal      = {CoRR},
  volume       = {abs/2007.07206},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.07206},
  eprinttype   = {arXiv},
  eprint       = {2007.07206},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-07206.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-10427,
  author       = {Parthasarathi, Prasanna and
                  Pineau, Joelle and
                  Chandar, Sarath},
  title        = {How To Evaluate Your Dialogue System: Probe Tasks as an Alternative
                  for Token-level Evaluation Metrics},
  journal      = {CoRR},
  volume       = {abs/2008.10427},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.10427},
  eprinttype   = {arXiv},
  eprint       = {2008.10427},
  timestamp    = {Fri, 28 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-10427.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-11811,
  author       = {Harsh Satija and
                  Philip Amortila and
                  Joelle Pineau},
  title        = {Constrained {Markov} Decision Processes via Backward Value Functions},
  journal      = {CoRR},
  volume       = {abs/2008.11811},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.11811},
  eprinttype   = {arXiv},
  eprint       = {2008.11811},
  timestamp    = {Tue, 15 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-11811.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-13579,
  author       = {Tao, Ruo Yu and
                  Fran{\c{c}}ois{-}Lavet, Vincent and
                  Pineau, Joelle},
  title        = {Novelty Search in representational space for sample efficient exploration},
  journal      = {CoRR},
  volume       = {abs/2009.13579},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.13579},
  eprinttype   = {arXiv},
  eprint       = {2009.13579},
  timestamp    = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-13579.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-03691,
  author       = {Jeon, Wonseok and
                  Su, Chen{-}Yang and
                  Barde, Paul and
                  Doan, Thang and
                  Nowrouzezahrai, Derek and
                  Pineau, Joelle},
  title        = {Regularized Inverse Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2010.03691},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.03691},
  eprinttype   = {arXiv},
  eprint       = {2010.03691},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-03691.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-15896,
  author       = {Bullard, Kalesha and
                  Meier, Franziska and
                  Kiela, Douwe and
                  Pineau, Joelle and
                  Foerster, Jakob N.},
  title        = {Exploring Zero-Shot Emergent Communication in Embodied Multi-Agent
                  Populations},
  journal      = {CoRR},
  volume       = {abs/2010.15896},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.15896},
  eprinttype   = {arXiv},
  eprint       = {2010.15896},
  timestamp    = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-15896.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-02055,
  author       = {Melissa Mozifian and
                  Amy Zhang and
                  Joelle Pineau and
                  David Meger},
  title        = {Intervention Design for Effective {Sim2Real} Transfer},
  journal      = {CoRR},
  volume       = {abs/2012.02055},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.02055},
  eprinttype   = {arXiv},
  eprint       = {2012.02055},
  timestamp    = {Fri, 04 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-02055.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/Francois-LavetR19,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Rabusseau, Guillaume and
                  Pineau, Joelle and
                  Ernst, Damien and
                  Fonteneau, Raphael},
  title        = {On Overfitting and Asymptotic Bias in Batch Reinforcement Learning
                  with Partial Observability},
  journal      = {J. Artif. Intell. Res.},
  volume       = {65},
  pages        = {1--30},
  year         = {2019},
  url          = {https://doi.org/10.1613/jair.1.11478},
  doi          = {10.1613/JAIR.1.11478},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/Francois-LavetR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/CrawfordP19,
  author       = {Crawford, Eric and
                  Pineau, Joelle},
  title        = {Spatially Invariant Unsupervised Object Detection with Convolutional
                  Neural Networks},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {3412--3420},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33013412},
  doi          = {10.1609/AAAI.V33I01.33013412},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CrawfordP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DoanMAMDPH19,
  author       = {Thang Doan and
                  Jo{\~{a}}o Monteiro and
                  Isabela Albuquerque and
                  Bogdan Mazoure and
                  Audrey Durand and
                  Joelle Pineau and
                  R. Devon Hjelm},
  title        = {On-Line Adaptative Curriculum Learning for {GANs}},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {3470--3477},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33013470},
  doi          = {10.1609/AAAI.V33I01.33013470},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DoanMAMDPH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Francois-LavetB19,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Bengio, Yoshua and
                  Precup, Doina and
                  Pineau, Joelle},
  title        = {Combined Reinforcement Learning via Abstract Representations},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {3582--3589},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33013582},
  doi          = {10.1609/AAAI.V33I01.33013582},
  timestamp    = {Tue, 02 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/Francois-LavetB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/WangZLSP19,
  author       = {Wang, Boyu and
                  Zhang, Hejia and
                  Liu, Peng and
                  Shen, Zebang and
                  Pineau, Joelle},
  editor       = {Chaudhuri, Kamalika and
                  Sugiyama, Masashi},
  title        = {Multitask Metric Learning: Theory and Algorithm},
  booktitle    = {The 22nd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series       = {Proceedings of Machine Learning Research},
  volume       = {89},
  pages        = {3362--3371},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v89/wang19f.html},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aistats/WangZLSP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LoweFBPD19,
  author       = {Lowe, Ryan and
                  Foerster, Jakob N. and
                  Boureau, Y{-}Lan and
                  Pineau, Joelle and
                  Dauphin, Yann N.},
  editor       = {Elkind, Edith and
                  Veloso, Manuela and
                  Agmon, Noa and
                  Taylor, Matthew E.},
  title        = {On the Pitfalls of Measuring Emergent Communication},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {693--701},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3331757},
  timestamp    = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/LoweFBPD19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/MazoureDDPH19,
  author       = {Mazoure, Bogdan and
                  Doan, Thang and
                  Durand, Audrey and
                  Pineau, Joelle and
                  Hjelm, R. Devon},
  editor       = {Kaelbling, Leslie Pack and
                  Kragic, Danica and
                  Sugiura, Komei},
  title        = {Leveraging exploration in off-policy algorithms via normalizing flows},
  booktitle    = {3rd Annual Conference on Robot Learning, CoRL 2019, Osaka, Japan,
                  October 30 - November 1, 2019, Proceedings},
  series       = {Proceedings of Machine Learning Research},
  volume       = {100},
  pages        = {430--444},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v100/mazoure20a.html},
  timestamp    = {Mon, 25 May 2020 12:12:52 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/MazoureDDPH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/GuptaLFKP19,
  author       = {Gupta, Abhinav and
                  Lowe, Ryan and
                  Foerster, Jakob N. and
                  Kiela, Douwe and
                  Pineau, Joelle},
  editor       = {Mogadala, Aditya and
                  Klakow, Dietrich and
                  Pezzelle, Sandro and
                  Moens, Marie{-}Francine},
  title        = {Seeded self-play for language learning},
  booktitle    = {Proceedings of the Beyond Vision and LANguage: inTEgrating Real-world
                  kNowledge, LANTERN@EMNLP-IJCNLP 2019, Hong Kong, China, November 3,
                  2019},
  pages        = {62--66},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-6409},
  doi          = {10.18653/V1/D19-6409},
  timestamp    = {Fri, 06 Aug 2021 00:40:22 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/GuptaLFKP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/SinhaSDPH19,
  author       = {Sinha, Koustuv and
                  Sodhani, Shagun and
                  Dong, Jin and
                  Pineau, Joelle and
                  Hamilton, William L.},
  editor       = {Inui, Kentaro and
                  Jiang, Jing and
                  Ng, Vincent and
                  Wan, Xiaojun},
  title        = {{CLUTRR:} {A} Diagnostic Benchmark for Inductive Reasoning from Text},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {4505--4514},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1458},
  doi          = {10.18653/V1/D19-1458},
  timestamp    = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SinhaSDPH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/DasGRBPRP19,
  author       = {Abhishek Das and
                  Th{\'{e}}ophile Gervet and
                  Joshua Romoff and
                  Dhruv Batra and
                  Devi Parikh and
                  Mike Rabbat and
                  Joelle Pineau},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {{TarMAC}: Targeted Multi-Agent Communication},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {1538--1546},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/das19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DasGRBPRP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR vol. 97); url only, no doi field.
% NOTE(review): DBLP:journals/corr/abs-1902-01883 in this file has the same six
% authors and a near-identical title -- presumably its preprint; confirm before
% citing both.
@inproceedings{DBLP:conf/icml/Romoff0TOPB19,
  author       = {Joshua Romoff and
                  Peter Henderson and
                  Ahmed Touati and
                  Yann Ollivier and
                  Joelle Pineau and
                  Emma Brunskill},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {Separable value functions across time-scales},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {5468--5477},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/romoff19a.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Romoff0TOPB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2019 paper (IEEE), identified by doi.
% "LiDAR" is brace-protected so sentence-casing styles keep its mixed case.
@inproceedings{DBLP:conf/iros/CacciaHCP19,
  author       = {Lucas Caccia and
                  Herke van Hoof and
                  Aaron C. Courville and
                  Joelle Pineau},
  title        = {Deep Generative Modeling of {LiDAR} Data},
  booktitle    = {2019 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2019, Macau, SAR, China, November 3-8, 2019},
  pages        = {5034--5040},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/IROS40897.2019.8968535},
  doi          = {10.1109/IROS40897.2019.8968535},
  timestamp    = {Fri, 31 Jan 2020 10:27:14 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/CacciaHCP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper; url only, no doi or publisher field.
% Braces protect the game name "Diplomacy" in the title and the acronym
% "NeurIPS" in the booktitle, as other acronyms in this file are protected.
@inproceedings{DBLP:conf/nips/PaquetteLBSOKPS19,
  author       = {Philip Paquette and
                  Yuchen Lu and
                  Steven Bocco and
                  Max O. Smith and
                  Satya Ortiz{-}Gagne and
                  Jonathan K. Kummerfeld and
                  Joelle Pineau and
                  Satinder Singh and
                  Aaron C. Courville},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {No-Press {Diplomacy:} Modeling Multi-Agent Gameplay},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {4476--4487},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/84b20b1f5a0d103f5710bb67a043cd78-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PaquetteLBSOKPS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper; url only, no doi or publisher field.
% "NeurIPS" is braced in the booktitle like the other venue acronyms in this file.
@inproceedings{DBLP:conf/nips/AssranRBPR19,
  author       = {Mahmoud Assran and
                  Joshua Romoff and
                  Nicolas Ballas and
                  Joelle Pineau and
                  Mike Rabbat},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {Gossip-based Actor-Learner Architectures for Deep Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {13299--13309},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/a1a527267c0d33a86382a03c4c721cd2-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/AssranRBPR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2019 paper, in Proceedings of Machine Learning Research vol. 115;
% url only, no doi field.
@inproceedings{DBLP:conf/uai/TouatiSRPV19,
  author       = {Ahmed Touati and
                  Harsh Satija and
                  Joshua Romoff and
                  Joelle Pineau and
                  Pascal Vincent},
  editor       = {Amir Globerson and
                  Ricardo Silva},
  title        = {Randomized Value Functions via Multiplicative Normalizing Flows},
  booktitle    = {Proceedings of the Thirty-Fifth Conference on Uncertainty in Artificial
                  Intelligence, {UAI} 2019, Tel Aviv, Israel, July 22-25, 2019},
  series       = {Proceedings of Machine Learning Research},
  volume       = {115},
  pages        = {422--432},
  publisher    = {{AUAI} Press},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v115/touati20a.html},
  timestamp    = {Tue, 15 Dec 2020 17:40:18 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/TouatiSRPV19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1902.00098.
% "ConvAI2" is brace-protected so sentence-casing styles keep its mixed case.
@article{DBLP:journals/corr/abs-1902-00098,
  author       = {Emily Dinan and
                  Varvara Logacheva and
                  Valentin Malykh and
                  Alexander H. Miller and
                  Kurt Shuster and
                  Jack Urbanek and
                  Douwe Kiela and
                  Arthur Szlam and
                  Iulian Serban and
                  Ryan Lowe and
                  Shrimai Prabhumoye and
                  Alan W. Black and
                  Alexander I. Rudnicky and
                  Jason D. Williams and
                  Joelle Pineau and
                  Mikhail Burtsev and
                  Jason Weston},
  title        = {The Second Conversational Intelligence Challenge ({ConvAI2})},
  journal      = {CoRR},
  volume       = {abs/1902.00098},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.00098},
  eprinttype   = {arXiv},
  eprint       = {1902.00098},
  timestamp    = {Fri, 01 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-00098.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1902.01883.
% NOTE(review): DBLP:conf/icml/Romoff0TOPB19 in this file has the same six
% authors and a near-identical title -- presumably the published version; confirm.
@article{DBLP:journals/corr/abs-1902-01883,
  author       = {Joshua Romoff and
                  Peter Henderson and
                  Ahmed Touati and
                  Yann Ollivier and
                  Emma Brunskill and
                  Joelle Pineau},
  title        = {Separating value functions across time-scales},
  journal      = {CoRR},
  volume       = {abs/1902.01883},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.01883},
  eprinttype   = {arXiv},
  eprint       = {1902.01883},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-01883.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1903.05168.
@article{DBLP:journals/corr/abs-1903-05168,
  author       = {Ryan Lowe and
                  Jakob N. Foerster and
                  Y{-}Lan Boureau and
                  Joelle Pineau and
                  Yann N. Dauphin},
  title        = {On the Pitfalls of Measuring Emergent Communication},
  journal      = {CoRR},
  volume       = {abs/1903.05168},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.05168},
  eprinttype   = {arXiv},
  eprint       = {1903.05168},
  timestamp    = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-05168.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1905.06893.
@article{DBLP:journals/corr/abs-1905-06893,
  author       = {Bogdan Mazoure and
                  Thang Doan and
                  Audrey Durand and
                  R. Devon Hjelm and
                  Joelle Pineau},
  title        = {Leveraging exploration in off-policy algorithms via normalizing flows},
  journal      = {CoRR},
  volume       = {abs/1905.06893},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.06893},
  eprinttype   = {arXiv},
  eprint       = {1905.06893},
  timestamp    = {Tue, 28 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-06893.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1905.09562.
@article{DBLP:journals/corr/abs-1905-09562,
  author       = {Pierre Thodoroff and
                  Nishanth Anand and
                  Lucas Caccia and
                  Doina Precup and
                  Joelle Pineau},
  title        = {Recurrent Value Functions},
  journal      = {CoRR},
  volume       = {abs/1905.09562},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.09562},
  eprinttype   = {arXiv},
  eprint       = {1905.09562},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-09562.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1906.04585.
% NOTE(review): same title and author list as DBLP:conf/nips/AssranRBPR19 in
% this file -- presumably the preprint of that paper; confirm before citing both.
@article{DBLP:journals/corr/abs-1906-04585,
  author       = {Mahmoud Assran and
                  Joshua Romoff and
                  Nicolas Ballas and
                  Joelle Pineau and
                  Mike Rabbat},
  title        = {Gossip-based Actor-Learner Architectures for Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1906.04585},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.04585},
  eprinttype   = {arXiv},
  eprint       = {1906.04585},
  timestamp    = {Fri, 14 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-04585.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1906.10437.
@article{DBLP:journals/corr/abs-1906-10437,
  author       = {Amy Zhang and
                  Zachary C. Lipton and
                  Luis Pineda and
                  Kamyar Azizzadenesheli and
                  Anima Anandkumar and
                  Laurent Itti and
                  Joelle Pineau and
                  Tommaso Furlanello},
  title        = {Learning Causal State Representations of Partially Observable Environments},
  journal      = {CoRR},
  volume       = {abs/1906.10437},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.10437},
  eprinttype   = {arXiv},
  eprint       = {1906.10437},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-10437.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1908.06177.
% NOTE(review): same title as DBLP:conf/emnlp/SinhaSDPH19 in this file --
% presumably the preprint of that paper; confirm before citing both.
@article{DBLP:journals/corr/abs-1908-06177,
  author       = {Koustuv Sinha and
                  Shagun Sodhani and
                  Jin Dong and
                  Joelle Pineau and
                  William L. Hamilton},
  title        = {{CLUTRR:} {A} Diagnostic Benchmark for Inductive Reasoning from Text},
  journal      = {CoRR},
  volume       = {abs/1908.06177},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.06177},
  eprinttype   = {arXiv},
  eprint       = {1908.06177},
  timestamp    = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-06177.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1909.02128.
% "Diplomacy" (the game's name) is brace-protected against sentence-casing styles.
% NOTE(review): near-identical title and same author set as
% DBLP:conf/nips/PaquetteLBSOKPS19 in this file -- presumably its preprint; confirm.
@article{DBLP:journals/corr/abs-1909-02128,
  author       = {Philip Paquette and
                  Yuchen Lu and
                  Steven Bocco and
                  Max O. Smith and
                  Satya Ortiz{-}Gagne and
                  Jonathan K. Kummerfeld and
                  Satinder Singh and
                  Joelle Pineau and
                  Aaron C. Courville},
  title        = {No Press {Diplomacy:} Modeling Multi-Agent Gameplay},
  journal      = {CoRR},
  volume       = {abs/1909.02128},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.02128},
  eprinttype   = {arXiv},
  eprint       = {1909.02128},
  timestamp    = {Thu, 21 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-02128.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1909.07543.
@article{DBLP:journals/corr/abs-1909-07543,
  author       = {Thang Doan and
                  Bogdan Mazoure and
                  Audrey Durand and
                  Joelle Pineau and
                  R. Devon Hjelm},
  title        = {Attraction-Repulsion Actor-Critic for Continuous Control Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1909.07543},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.07543},
  eprinttype   = {arXiv},
  eprint       = {1909.07543},
  timestamp    = {Mon, 23 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-07543.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1910.01708.
@article{DBLP:journals/corr/abs-1910-01708,
  author       = {Scott Fujimoto and
                  Edoardo Conti and
                  Mohammad Ghavamzadeh and
                  Joelle Pineau},
  title        = {Benchmarking Batch Deep Reinforcement Learning Algorithms},
  journal      = {CoRR},
  volume       = {abs/1910.01708},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.01708},
  eprinttype   = {arXiv},
  eprint       = {1910.01708},
  timestamp    = {Wed, 09 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-01708.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1910.01741.
@article{DBLP:journals/corr/abs-1910-01741,
  author       = {Denis Yarats and
                  Amy Zhang and
                  Ilya Kostrikov and
                  Brandon Amos and
                  Joelle Pineau and
                  Rob Fergus},
  title        = {Improving Sample Efficiency in Model-Free Reinforcement Learning from
                  Images},
  journal      = {CoRR},
  volume       = {abs/1910.01741},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.01741},
  eprinttype   = {arXiv},
  eprint       = {1910.01741},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-01741.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1910.04054.
@article{DBLP:journals/corr/abs-1910-04054,
  author       = {Viswanath Sivakumar and
                  Tim Rockt{\"{a}}schel and
                  Alexander H. Miller and
                  Heinrich K{\"{u}}ttler and
                  Nantas Nardelli and
                  Mike Rabbat and
                  Joelle Pineau and
                  Sebastian Riedel},
  title        = {{MVFST-RL:} An Asynchronous {RL} Framework for Congestion Control
                  with Delayed Actions},
  journal      = {CoRR},
  volume       = {abs/1910.04054},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.04054},
  eprinttype   = {arXiv},
  eprint       = {1910.04054},
  timestamp    = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-04054.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1911.08019.
@article{DBLP:journals/corr/abs-1911-08019,
  author       = {Lucas Caccia and
                  Eugene Belilovsky and
                  Massimo Caccia and
                  Joelle Pineau},
  title        = {Online Learned Continual Compression with Stacked Quantization Module},
  journal      = {CoRR},
  volume       = {abs/1911.08019},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.08019},
  eprinttype   = {arXiv},
  eprint       = {1911.08019},
  timestamp    = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-08019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1911.09033.
@article{DBLP:journals/corr/abs-1911-09033,
  author       = {Eric Crawford and
                  Joelle Pineau},
  title        = {Exploiting Spatial Invariance for Scalable Unsupervised Object Tracking},
  journal      = {CoRR},
  volume       = {abs/1911.09033},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.09033},
  eprinttype   = {arXiv},
  eprint       = {1911.09033},
  timestamp    = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-09033.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Dialogue & Discourse 9(1), 2018; url only, no doi field.
% The journal name carries its ampersand (escaped for LaTeX) rather than the
% two bare words.
@article{DBLP:journals/dad/SerbanLHCP18,
  author       = {Iulian Vlad Serban and
                  Ryan Lowe and
                  Peter Henderson and
                  Laurent Charlin and
                  Joelle Pineau},
  title        = {A Survey of Available Corpora For Building Data-Driven Dialogue Systems:
                  The Journal Version},
  journal      = {Dialogue {\&} Discourse},
  volume       = {9},
  number       = {1},
  pages        = {1--49},
  year         = {2018},
  url          = {http://dad.uni-bielefeld.de/index.php/dad/article/view/3690},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/dad/SerbanLHCP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Found. Trends Mach. Learn. vol. 11, issue 3-4, pp. 219--354
% (2018); identified by doi.
@article{DBLP:journals/ftml/Francois-LavetH18,
  author       = {Vincent Fran{\c{c}}ois{-}Lavet and
                  Peter Henderson and
                  Riashat Islam and
                  Marc G. Bellemare and
                  Joelle Pineau},
  title        = {An Introduction to Deep Reinforcement Learning},
  journal      = {Found. Trends Mach. Learn.},
  volume       = {11},
  number       = {3-4},
  pages        = {219--354},
  year         = {2018},
  url          = {https://doi.org/10.1561/2200000071},
  doi          = {10.1561/2200000071},
  timestamp    = {Thu, 18 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ftml/Francois-LavetH18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Int. J. Soc. Robotics 10(1), 2018.
% The doi field is upper-cased relative to the url; DOI names are
% case-insensitive, so the two spellings identify the same record.
@article{DBLP:journals/ijsr/GhorbelPGJS18,
  author       = {Mahmoud Ghorbel and
                  Joelle Pineau and
                  Richard Gourdeau and
                  Shervin Javdani and
                  Siddhartha S. Srinivasa},
  title        = {A Decision-Theoretic Approach for the Collaborative Control of a Smart
                  Wheelchair},
  journal      = {Int. J. Soc. Robotics},
  volume       = {10},
  number       = {1},
  pages        = {131--145},
  year         = {2018},
  url          = {https://doi.org/10.1007/s12369-017-0434-7},
  doi          = {10.1007/S12369-017-0434-7},
  timestamp    = {Fri, 25 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijsr/GhorbelPGJS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Mach. Learn. Res. vol. 19 (2018); url only, no doi field.
% NOTE(review): pages look like an article-number:page range (17:1--17:34) --
% confirm the target style renders this form as intended.
@article{DBLP:journals/jmlr/DurandMP18,
  author       = {Audrey Durand and
                  Odalric{-}Ambrym Maillard and
                  Joelle Pineau},
  title        = {Streaming kernel regression with provably adaptive mean, variance,
                  and regularization},
  journal      = {J. Mach. Learn. Res.},
  volume       = {19},
  pages        = {17:1--17:34},
  year         = {2018},
  url          = {https://jmlr.org/papers/v19/17-404.html},
  timestamp    = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/DurandMP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper (AAAI Press), identified by doi.
% "OptionGAN" is brace-protected so sentence-casing styles keep its mixed case;
% the booktitle capitalizes "Innovative" as part of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/0002CBMPP18,
  author       = {Peter Henderson and
                  Wei{-}Di Chang and
                  Pierre{-}Luc Bacon and
                  David Meger and
                  Joelle Pineau and
                  Doina Precup},
  editor       = {Sheila A. McIlraith and
                  Kilian Q. Weinberger},
  title        = {{OptionGAN:} Learning Joint Reward-Policy Options Using Generative Adversarial
                  Inverse Reinforcement Learning},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {3199--3206},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11775},
  doi          = {10.1609/AAAI.V32I1.11775},
  timestamp    = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/0002CBMPP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper (AAAI Press), identified by doi.
% The booktitle capitalizes "Innovative" as part of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/0002IBPPM18,
  author       = {Peter Henderson and
                  Riashat Islam and
                  Philip Bachman and
                  Joelle Pineau and
                  Doina Precup and
                  David Meger},
  editor       = {Sheila A. McIlraith and
                  Kilian Q. Weinberger},
  title        = {Deep Reinforcement Learning That Matters},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {3207--3214},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11694},
  doi          = {10.1609/AAAI.V32I1.11694},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/0002IBPPM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AIES 2018 paper (ACM), identified by doi.
% "AI" is braced in the booktitle like the other acronyms there.
@inproceedings{DBLP:conf/aies/0002SAKFLP18,
  author       = {Peter Henderson and
                  Koustuv Sinha and
                  Nicolas Angelard{-}Gontier and
                  Nan Rosemary Ke and
                  Genevieve Fried and
                  Ryan Lowe and
                  Joelle Pineau},
  editor       = {Jason Furman and
                  Gary E. Marchant and
                  Huw Price and
                  Francesca Rossi},
  title        = {Ethical Challenges in Data-Driven Dialogue Systems},
  booktitle    = {Proceedings of the 2018 {AAAI/ACM} Conference on {AI}, Ethics, and Society,
                  {AIES} 2018, New Orleans, LA, USA, February 02-03, 2018},
  pages        = {123--129},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3278721.3278777},
  doi          = {10.1145/3278721.3278777},
  timestamp    = {Tue, 23 Jan 2024 13:25:45 +0100},
  biburl       = {https://dblp.org/rec/conf/aies/0002SAKFLP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2018 paper (PMLR vol. 87); url only, no doi field.
% "CoRL" is braced in the booktitle like the other venue acronyms in this file.
% NOTE(review): DBLP:conf/iclr/RomoffP0FP18 and DBLP:journals/corr/abs-1805-03359
% in this file carry the same title -- presumably versions of the same work; confirm.
@inproceedings{DBLP:conf/corl/Romoff0PFP18,
  author       = {Joshua Romoff and
                  Peter Henderson and
                  Alexandre Pich{\'{e}} and
                  Vincent Fran{\c{c}}ois{-}Lavet and
                  Joelle Pineau},
  title        = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  booktitle    = {2nd Annual Conference on Robot Learning, {CoRL} 2018, Z{\"{u}}rich,
                  Switzerland, 29-31 October 2018, Proceedings},
  series       = {Proceedings of Machine Learning Research},
  volume       = {87},
  pages        = {674--699},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v87/romoff18a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:24 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/Romoff0PFP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2018 paper (Association for Computational Linguistics).
% The url and doi fields differ only in letter case (d18-1073 vs. D18-1073).
@inproceedings{DBLP:conf/emnlp/ParthasarathiP18,
  author       = {Prasanna Parthasarathi and
                  Joelle Pineau},
  editor       = {Ellen Riloff and
                  David Chiang and
                  Julia Hockenmaier and
                  Jun'ichi Tsujii},
  title        = {Extending Neural Generative Conversational Model using External Knowledge
                  Sources},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {690--695},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1073},
  doi          = {10.18653/V1/D18-1073},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ParthasarathiP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 Workshop Track paper (OpenReview); no pages or doi field.
% NOTE(review): DBLP:conf/corl/Romoff0PFP18 and DBLP:journals/corr/abs-1805-03359
% in this file carry the same title -- presumably versions of the same work; confirm.
@inproceedings{DBLP:conf/iclr/RomoffP0FP18,
  author       = {Joshua Romoff and
                  Alexandre Pich{\'{e}} and
                  Peter Henderson and
                  Vincent Fran{\c{c}}ois{-}Lavet and
                  Joelle Pineau},
  title        = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=r1vcHYJvM},
  timestamp    = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/RomoffP0FP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 Workshop Track paper (OpenReview); no pages or doi field.
% NOTE(review): same title and authors as DBLP:journals/corr/abs-1804-10689 in
% this file -- presumably its preprint; confirm before citing both.
@inproceedings{DBLP:conf/iclr/ZhangSP18,
  author       = {Amy Zhang and
                  Harsh Satija and
                  Joelle Pineau},
  title        = {Decoupling Dynamics and Reward for Transfer Learning},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=H1aoddyvM},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhangSP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR vol. 80); url only, no doi field.
% "RNNs" is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/icml/KeZSLTBPCP18,
  author       = {Nan Rosemary Ke and
                  Konrad Zolna and
                  Alessandro Sordoni and
                  Zhouhan Lin and
                  Adam Trischler and
                  Yoshua Bengio and
                  Joelle Pineau and
                  Laurent Charlin and
                  Christopher J. Pal},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10-15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {2559--2568},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/ke18a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KeZSLTBPCP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR vol. 80); url only, no doi field.
@inproceedings{DBLP:conf/icml/SmithHP18,
  author       = {Matthew J. A. Smith and
                  Herke van Hoof and
                  Joelle Pineau},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {An Inference-Based Policy Gradient Method for Learning Options},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10-15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {4710--4719},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/smith18a.html},
  timestamp    = {Thu, 07 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/SmithHP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% MLHC 2018 paper (PMLR vol. 85); url only, no doi field.
@inproceedings{DBLP:conf/mlhc/DurandAISMP18,
  author       = {Audrey Durand and
                  Charis Achilleos and
                  Demetris Iacovides and
                  Katerina Strati and
                  Georgios D. Mitsis and
                  Joelle Pineau},
  editor       = {Finale Doshi{-}Velez and
                  Jim Fackler and
                  Ken Jung and
                  David C. Kale and
                  Rajesh Ranganath and
                  Byron C. Wallace and
                  Jenna Wiens},
  title        = {Contextual Bandits for Adapting Treatment in a Mouse Model of de Novo
                  Carcinogenesis},
  booktitle    = {Proceedings of the Machine Learning for Healthcare Conference, {MLHC}
                  2018, 17-18 August 2018, Palo Alto, California},
  series       = {Proceedings of Machine Learning Research},
  volume       = {85},
  pages        = {67--82},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v85/durand18a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:31 +0200},
  biburl       = {https://dblp.org/rec/conf/mlhc/DurandAISMP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 paper; url only, no doi or publisher field.
% Braces protect the proper noun "Markov" in the title and the acronym
% "NeurIPS" in the booktitle against case-changing styles.
@inproceedings{DBLP:conf/nips/ThodoroffDPP18,
  author       = {Pierre Thodoroff and
                  Audrey Durand and
                  Joelle Pineau and
                  Doina Precup},
  editor       = {Samy Bengio and
                  Hanna M. Wallach and
                  Hugo Larochelle and
                  Kristen Grauman and
                  Nicol{\`{o}} Cesa{-}Bianchi and
                  Roman Garnett},
  title        = {Temporal Regularization for {Markov} Decision Process},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, {NeurIPS} 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {1784--1794},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/4b0250793549726d5c1ea3906726ebfe-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ThodoroffDPP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR), eprint 1801.06700.
@article{DBLP:journals/corr/abs-1801-06700,
  author       = {Iulian Vlad Serban and
                  Chinnadhurai Sankar and
                  Mathieu Germain and
                  Saizheng Zhang and
                  Zhouhan Lin and
                  Sandeep Subramanian and
                  Taesup Kim and
                  Michael Pieper and
                  Sarath Chandar and
                  Nan Rosemary Ke and
                  Sai Rajeswar and
                  Alexandre de Br{\'{e}}bisson and
                  Jose M. R. Sotelo and
                  Dendi Suhubdy and
                  Vincent Michalski and
                  Alexandre Nguyen and
                  Joelle Pineau and
                  Yoshua Bengio},
  title        = {A Deep Reinforcement Learning Chatbot (Short Version)},
  journal      = {CoRR},
  volume       = {abs/1801.06700},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.06700},
  eprinttype   = {arXiv},
  eprint       = {1801.06700},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-06700.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-09484,
  author       = {Thomas, Valentin and
                  Bengio, Emmanuel and
                  Fedus, William and
                  Pondard, Jules and
                  Beaudoin, Philippe and
                  Larochelle, Hugo and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Disentangling the independently controllable factors of variation
                  by interacting with the world},
  journal      = {CoRR},
  volume       = {abs/1802.09484},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.09484},
  eprinttype   = {arXiv},
  eprint       = {1802.09484},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-09484.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-10689,
  author       = {Zhang, Amy and
                  Satija, Harsh and
                  Pineau, Joelle},
  title        = {Decoupling Dynamics and Reward for Transfer Learning},
  journal      = {CoRR},
  volume       = {abs/1804.10689},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.10689},
  eprinttype   = {arXiv},
  eprint       = {1804.10689},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-10689.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-03359,
  author       = {Romoff, Joshua and
                  Pich{\'{e}}, Alexandre and
                  Henderson, Peter and
                  Fran{\c{c}}ois{-}Lavet, Vincent and
                  Pineau, Joelle},
  title        = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1805.03359},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.03359},
  eprinttype   = {arXiv},
  eprint       = {1805.03359},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-03359.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-02315,
  author       = {Touati, Ahmed and
                  Satija, Harsh and
                  Romoff, Joshua and
                  Pineau, Joelle and
                  Vincent, Pascal},
  title        = {Randomized Value Functions via Multiplicative Normalizing Flows},
  journal      = {CoRR},
  volume       = {abs/1806.02315},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.02315},
  eprinttype   = {arXiv},
  eprint       = {1806.02315},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-02315.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-04342,
  author       = {Ke, Nan Rosemary and
                  Zolna, Konrad and
                  Sordoni, Alessandro and
                  Lin, Zhouhan and
                  Trischler, Adam and
                  Bengio, Yoshua and
                  Pineau, Joelle and
                  Charlin, Laurent and
                  Pal, Chris},
  title        = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  journal      = {CoRR},
  volume       = {abs/1806.04342},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.04342},
  eprinttype   = {arXiv},
  eprint       = {1806.04342},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-04342.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-07937,
  author       = {Zhang, Amy and
                  Ballas, Nicolas and
                  Pineau, Joelle},
  title        = {A Dissection of Overfitting and Generalization in Continuous Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1806.07937},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.07937},
  eprinttype   = {arXiv},
  eprint       = {1806.07937},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-07937.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-04723,
  author       = {Serban, Iulian Vlad and
                  Sankar, Chinnadhurai and
                  Pieper, Michael and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {The Bottleneck Simulator: {A} Model-based Deep Reinforcement Learning
                  Approach},
  journal      = {CoRR},
  volume       = {abs/1807.04723},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.04723},
  eprinttype   = {arXiv},
  eprint       = {1807.04723},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-04723.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-00020,
  author       = {Doan, Thang and
                  Monteiro, Jo{\~{a}}o and
                  Albuquerque, Isabela and
                  Mazoure, Bogdan and
                  Durand, Audrey and
                  Pineau, Joelle and
                  Hjelm, R. Devon},
  title        = {Online Adaptative Curriculum Learning for {GANs}},
  journal      = {CoRR},
  volume       = {abs/1808.00020},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.00020},
  eprinttype   = {arXiv},
  eprint       = {1808.00020},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-00020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04506,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Bengio, Yoshua and
                  Precup, Doina and
                  Pineau, Joelle},
  title        = {Combined Reinforcement Learning via Abstract Representations},
  journal      = {CoRR},
  volume       = {abs/1809.04506},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04506},
  eprinttype   = {arXiv},
  eprint       = {1809.04506},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04506.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04988,
  author       = {Crawford, Eric and
                  Rabusseau, Guillaume and
                  Pineau, Joelle},
  title        = {Sequential Coordination of Deep Models for Learning Visual Arithmetic},
  journal      = {CoRR},
  volume       = {abs/1809.04988},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04988},
  eprinttype   = {arXiv},
  eprint       = {1809.04988},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04988.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-05524,
  author       = {Parthasarathi, Prasanna and
                  Pineau, Joelle},
  title        = {Extending Neural Generative Conversational Model using External Knowledge
                  Sources},
  journal      = {CoRR},
  volume       = {abs/1809.05524},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.05524},
  eprinttype   = {arXiv},
  eprint       = {1809.05524},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-05524.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-02525,
  author       = {Henderson, Peter and
                  Romoff, Joshua and
                  Pineau, Joelle},
  title        = {Where Did My Optimum Go?: An Empirical Analysis of Gradient Descent
                  Optimization in Policy Gradient Methods},
  journal      = {CoRR},
  volume       = {abs/1810.02525},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.02525},
  eprinttype   = {arXiv},
  eprint       = {1810.02525},
  timestamp    = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-02525.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-11187,
  author       = {Das, Abhishek and
                  Gervet, Th{\'{e}}ophile and
                  Romoff, Joshua and
                  Batra, Dhruv and
                  Parikh, Devi and
                  Rabbat, Michael G. and
                  Pineau, Joelle},
  title        = {{TarMAC}: Targeted Multi-Agent Communication},
  journal      = {CoRR},
  volume       = {abs/1810.11187},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.11187},
  eprinttype   = {arXiv},
  eprint       = {1810.11187},
  timestamp    = {Mon, 09 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-11187.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-00429,
  author       = {Thodoroff, Pierre and
                  Durand, Audrey and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Temporal Regularization in {Markov} Decision Process},
  journal      = {CoRR},
  volume       = {abs/1811.00429},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.00429},
  eprinttype   = {arXiv},
  eprint       = {1811.00429},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-00429.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-01302,
  author       = {Henderson, Peter and
                  Sinha, Koustuv and
                  Ke, Nan Rosemary and
                  Pineau, Joelle},
  title        = {Adversarial Gain},
  journal      = {CoRR},
  volume       = {abs/1811.01302},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.01302},
  eprinttype   = {arXiv},
  eprint       = {1811.01302},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-01302.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-02549,
  author       = {Caccia, Massimo and
                  Caccia, Lucas and
                  Fedus, William and
                  Larochelle, Hugo and
                  Pineau, Joelle and
                  Charlin, Laurent},
  title        = {Language {GANs} Falling Short},
  journal      = {CoRR},
  volume       = {abs/1811.02549},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.02549},
  eprinttype   = {arXiv},
  eprint       = {1811.02549},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-02549.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-02714,
  author       = {Gontier, Nicolas and
                  Sinha, Koustuv and
                  Henderson, Peter and
                  Serban, Iulian and
                  Noseworthy, Michael and
                  Parthasarathi, Prasanna and
                  Pineau, Joelle},
  title        = {The {RLLChatbot}: a solution to the {ConvAI} challenge},
  journal      = {CoRR},
  volume       = {abs/1811.02714},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.02714},
  eprinttype   = {arXiv},
  eprint       = {1811.02714},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-02714.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-02959,
  author       = {Sinha, Koustuv and
                  Sodhani, Shagun and
                  Hamilton, William L. and
                  Pineau, Joelle},
  title        = {Compositional Language Understanding with Text-based Relational Reasoning},
  journal      = {CoRR},
  volume       = {abs/1811.02959},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.02959},
  eprinttype   = {arXiv},
  eprint       = {1811.02959},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-02959.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-06032,
  author       = {Zhang, Amy and
                  Wu, Yuxin and
                  Pineau, Joelle},
  title        = {Natural Environment Benchmarks for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1811.06032},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.06032},
  eprinttype   = {arXiv},
  eprint       = {1811.06032},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-06032.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-12560,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Henderson, Peter and
                  Islam, Riashat and
                  Bellemare, Marc G. and
                  Pineau, Joelle},
  title        = {An Introduction to Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1811.12560},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.12560},
  eprinttype   = {arXiv},
  eprint       = {1811.12560},
  timestamp    = {Mon, 03 Dec 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-12560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1812-01180,
  author       = {Caccia, Lucas and
                  van Hoof, Herke and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  title        = {Deep Generative Modeling of {LiDAR} Data},
  journal      = {CoRR},
  volume       = {abs/1812.01180},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.01180},
  eprinttype   = {arXiv},
  eprint       = {1812.01180},
  timestamp    = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-01180.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal title restored to "Dialogue & Discourse" (the ampersand had been dropped).
@article{DBLP:journals/dad/LowePSCLP17,
  author       = {Lowe, Ryan Thomas and
                  Pow, Nissan and
                  Serban, Iulian Vlad and
                  Charlin, Laurent and
                  Liu, Chia{-}Wei and
                  Pineau, Joelle},
  title        = {Training End-to-End Dialogue Systems with the {Ubuntu} Dialogue Corpus},
  journal      = {Dialogue \& Discourse},
  volume       = {8},
  number       = {1},
  pages        = {31--65},
  year         = {2017},
  url          = {http://dad.uni-bielefeld.de/index.php/dad/article/view/3698},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/dad/LowePSCLP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "El Youssef" is a two-word surname; the comma form keeps BibTeX from
% treating "El" as part of the given name.
@article{DBLP:journals/titb/EmamiYRPCH17,
  author       = {Emami, Ali and
                  El Youssef, Joseph and
                  Rabasa{-}Lhoret, Remi and
                  Pineau, Joelle and
                  Castle, Jessica R. and
                  Haidar, Ahmad},
  title        = {Modeling Glucagon Action in Patients With Type 1 Diabetes},
  journal      = {{IEEE} Journal of Biomedical and Health Informatics},
  volume       = {21},
  number       = {4},
  pages        = {1163--1171},
  year         = {2017},
  url          = {https://doi.org/10.1109/JBHI.2016.2593630},
  doi          = {10.1109/JBHI.2016.2593630},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/titb/EmamiYRPCH17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SerbanSLCPCB17,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Lowe, Ryan and
                  Charlin, Laurent and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Singh, Satinder and
                  Markovitch, Shaul},
  title        = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating
                  Dialogues},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {3295--3301},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.10983},
  doi          = {10.1609/AAAI.V31I1.10983},
  timestamp    = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SerbanSLCPCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LoweNSABP17,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  editor       = {Barzilay, Regina and
                  Kan, Min{-}Yen},
  title        = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {1116--1126},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1103},
  doi          = {10.18653/V1/P17-1103},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LoweNSABP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% doi/url hold the raw identifier: a LaTeX-escaped underscore would be kept
% literally by verbatim-field handling and break the resolver link.
@inproceedings{DBLP:conf/ai/SmithCP17,
  author       = {Smith, Matthew and
                  Charlin, Laurent and
                  Pineau, Joelle},
  editor       = {Mouhoub, Malek and
                  Langlais, Philippe},
  title        = {A Sparse Probabilistic Model of User Preference Data},
  booktitle    = {Advances in Artificial Intelligence - 30th Canadian Conference on
                  Artificial Intelligence, Canadian {AI} 2017, Edmonton, AB, Canada,
                  May 16-19, 2017, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {10233},
  pages        = {316--328},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-57351-9_36},
  doi          = {10.1007/978-3-319-57351-9_36},
  timestamp    = {Thu, 28 Sep 2023 12:27:16 +0200},
  biburl       = {https://dblp.org/rec/conf/ai/SmithCP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/SerbanOPC17a,
  author       = {Serban, Iulian Vlad and
                  Ororbia, Alexander and
                  Pineau, Joelle and
                  Courville, Aaron C.},
  editor       = {Chang, Kai{-}Wei and
                  Chang, Ming{-}Wei and
                  Srikumar, Vivek and
                  Rush, Alexander M.},
  title        = {Piecewise Latent Variables for Neural Variational Text Processing},
  booktitle    = {Proceedings of the 2nd Workshop on Structured Prediction for Natural
                  Language Processing, SPNLP@EMNLP, Copenhagen, Denmark, September 2017},
  pages        = {52--62},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-4308},
  doi          = {10.18653/V1/W17-4308},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SerbanOPC17a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "II" is a generational suffix: the "Last, Jr, First" form stops BibTeX
% from parsing it as the surname.
@inproceedings{DBLP:conf/emnlp/SerbanOPC17,
  author       = {Serban, Iulian Vlad and
                  Ororbia, II, Alexander G. and
                  Pineau, Joelle and
                  Courville, Aaron C.},
  editor       = {Palmer, Martha and
                  Hwa, Rebecca and
                  Riedel, Sebastian},
  title        = {Piecewise Latent Variables for Neural Variational Text Processing},
  booktitle    = {Proceedings of the 2017 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September
                  9-11, 2017},
  pages        = {422--432},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/d17-1043},
  doi          = {10.18653/V1/D17-1043},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SerbanOPC17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BahdanauBXGLPCB17,
  author       = {Bahdanau, Dzmitry and
                  Brakel, Philemon and
                  Xu, Kelvin and
                  Goyal, Anirudh and
                  Lowe, Ryan and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SJDaqqveg},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauBXGLPCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/LoweNSABP17,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  title        = {Towards an automatic {Turing} test: Learning to evaluate dialogue responses},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=Sk7c3yVYg},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LoweNSABP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/RabusseauBP17,
  author       = {Rabusseau, Guillaume and
                  Balle, Borja and
                  Pineau, Joelle},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Multitask Spectral Learning of Weighted Automata},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {2588--2597},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/e655c7716a4b3ea67f48c6322fc42ed6-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RabusseauBP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigdial/TruongPP17,
  author       = {Truong, Hoai Phuoc and
                  Parthasarathi, Prasanna and
                  Pineau, Joelle},
  editor       = {Jokinen, Kristiina and
                  Stede, Manfred and
                  DeVault, David and
                  Louis, Annie},
  title        = {{MACA}: {A} Modular Architecture for Conversational Agents},
  booktitle    = {Proceedings of the 18th Annual SIGdial Meeting on Discourse and Dialogue,
                  Saarbr{\"{u}}cken, Germany, August 15-17, 2017},
  pages        = {93--102},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-5513},
  doi          = {10.18653/V1/W17-5513},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/TruongPP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigdial/NoseworthyCP17,
  author       = {Noseworthy, Michael and
                  Cheung, Jackie Chi Kit and
                  Pineau, Joelle},
  editor       = {Jokinen, Kristiina and
                  Stede, Manfred and
                  DeVault, David and
                  Louis, Annie},
  title        = {Predicting Success in Goal-Driven Human-Human Dialogues},
  booktitle    = {Proceedings of the 18th Annual SIGdial Meeting on Discourse and Dialogue,
                  Saarbr{\"{u}}cken, Germany, August 15-17, 2017},
  pages        = {253--262},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-5531},
  doi          = {10.18653/V1/W17-5531},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/NoseworthyCP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioTPPB17,
  author       = {Bengio, Emmanuel and
                  Thomas, Valentin and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Independently Controllable Features},
  journal      = {CoRR},
  volume       = {abs/1703.07718},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.07718},
  eprinttype   = {arXiv},
  eprint       = {1703.07718},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioTPPB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-00768,
  author       = {Durand, Audrey and
                  Maillard, Odalric{-}Ambrym and
                  Pineau, Joelle},
  title        = {Streaming kernel regression with provably adaptive mean, variance,
                  and regularization},
  journal      = {CoRR},
  volume       = {abs/1708.00768},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.00768},
  eprinttype   = {arXiv},
  eprint       = {1708.00768},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-00768.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-01289,
  author       = {Thomas, Valentin and
                  Pondard, Jules and
                  Bengio, Emmanuel and
                  Sarfati, Marc and
                  Beaudoin, Philippe and
                  Meurs, Marie{-}Jean and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Independently Controllable Factors},
  journal      = {CoRR},
  volume       = {abs/1708.01289},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.01289},
  eprinttype   = {arXiv},
  eprint       = {1708.01289},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-01289.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1708-07149,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  title        = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  journal      = {CoRR},
  volume       = {abs/1708.07149},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.07149},
  eprinttype   = {arXiv},
  eprint       = {1708.07149},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-07149.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-02349,
  author       = {Serban, Iulian Vlad and
                  Sankar, Chinnadhurai and
                  Germain, Mathieu and
                  Zhang, Saizheng and
                  Lin, Zhouhan and
                  Subramanian, Sandeep and
                  Kim, Taesup and
                  Pieper, Michael and
                  Chandar, Sarath and
                  Ke, Nan Rosemary and
                  Mudumba, Sai and
                  de Br{\'{e}}bisson, Alexandre and
                  Sotelo, Jose and
                  Suhubdy, Dendi and
                  Michalski, Vincent and
                  Nguyen, Alexandre and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {A Deep Reinforcement Learning Chatbot},
  journal      = {CoRR},
  volume       = {abs/1709.02349},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.02349},
  eprinttype   = {arXiv},
  eprint       = {1709.02349},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-02349.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-06560,
  author       = {Henderson, Peter and
                  Islam, Riashat and
                  Bachman, Philip and
                  Pineau, Joelle and
                  Precup, Doina and
                  Meger, David},
  title        = {Deep Reinforcement Learning that Matters},
  journal      = {CoRR},
  volume       = {abs/1709.06560},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.06560},
  eprinttype   = {arXiv},
  eprint       = {1709.06560},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-06560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-06683,
  author       = {Henderson, Peter and
                  Chang, Wei{-}Di and
                  Bacon, Pierre{-}Luc and
                  Meger, David and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {{OptionGAN}: Learning Joint Reward-Policy Options using Generative Adversarial
                  Inverse Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1709.06683},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.06683},
  eprinttype   = {arXiv},
  eprint       = {1709.06683},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-06683.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-04755,
  author       = {Goyal, Anirudh and
                  Ke, Nan Rosemary and
                  Lamb, Alex and
                  Hjelm, R. Devon and
                  Pal, Chris and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {{ACtuAL}: Actor-Critic Under Adversarial Learning},
  journal      = {CoRR},
  volume       = {abs/1711.04755},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.04755},
  eprinttype   = {arXiv},
  eprint       = {1711.04755},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-04755.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-09050,
  author       = {Henderson, Peter and
                  Sinha, Koustuv and
                  Angelard{-}Gontier, Nicolas and
                  Ke, Nan Rosemary and
                  Fried, Genevieve and
                  Lowe, Ryan and
                  Pineau, Joelle},
  title        = {Ethical Challenges in Data-Driven Dialogue Systems},
  journal      = {CoRR},
  volume       = {abs/1711.09050},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.09050},
  eprinttype   = {arXiv},
  eprint       = {1711.09050},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-09050.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1712-09520,
  author       = {Cao, Xingwei and
                  Rabusseau, Guillaume and
                  Pineau, Joelle},
  title        = {Tensor Regression Networks with various Low-Rank Tensor Approximations},
  journal      = {CoRR},
  volume       = {abs/1712.09520},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.09520},
  eprinttype   = {arXiv},
  eprint       = {1712.09520},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-09520.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijsr/KimP16,
  author       = {Kim, Beomjoon and
                  Pineau, Joelle},
  title        = {Socially Adaptive Path Planning in Human Environments Using Inverse
                  Reinforcement Learning},
  journal      = {Int. J. Soc. Robotics},
  volume       = {8},
  number       = {1},
  pages        = {51--66},
  year         = {2016},
  url          = {https://doi.org/10.1007/s12369-015-0310-2},
  doi          = {10.1007/S12369-015-0310-2},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijsr/KimP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/BarretoPP16,
  author       = {Barreto, Andr{\'{e}} da Motta Salles and
                  Precup, Doina and
                  Pineau, Joelle},
  title        = {Practical Kernel-Based Reinforcement Learning},
  journal      = {J. Mach. Learn. Res.},
  volume       = {17},
  pages        = {67:1--67:70},
  year         = {2016},
  url          = {https://jmlr.org/papers/v17/13-134.html},
  timestamp    = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BarretoPP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tkde/WangP16,
  author       = {Wang, Boyu and
                  Pineau, Joelle},
  title        = {Online Bagging and Boosting for Imbalanced Data Streams},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {28},
  number       = {12},
  pages        = {3353--3366},
  year         = {2016},
  url          = {https://doi.org/10.1109/TKDE.2016.2609424},
  doi          = {10.1109/TKDE.2016.2609424},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tkde/WangP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/BarretoBPP16,
  author       = {Barreto, Andr{\'{e}} da Motta Salles and
                  Beirigo, Rafael L. and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {Incremental Stochastic Factorization for Online Reinforcement Learning},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {1468--1475},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.10311},
  doi          = {10.1609/AAAI.V30I1.10311},
  timestamp    = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/BarretoBPP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WangPB16,
  author       = {Wang, Boyu and
                  Pineau, Joelle and
                  Balle, Borja},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {Multitask Generalized Eigenvalue Program},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {2115--2121},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.10229},
  doi          = {10.1609/AAAI.V30I1.10229},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WangPB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/SerbanSBCP16,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {Building End-To-End Dialogue Systems Using Generative Hierarchical
                  Neural Network Models},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {3776--3784},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.9883},
  doi          = {10.1609/AAAI.V30I1.9883},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SerbanSBCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaiss/GerdzhevPMVF16,
  author       = {Gerdzhev, Martin and
                  Pineau, Joelle and
                  Mitchell, Ian M. and
                  Viswanathan, Pooja and
                  Foley, Genevi{\`{e}}ve},
  title        = {On the Use of Modular Software and Hardware for Designing Wheelchair
                  Robots},
  booktitle    = {2016 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 21-23, 2016},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS16/paper/view/12704},
  timestamp    = {Wed, 14 Nov 2018 13:16:02 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/GerdzhevPMVF16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/emnlp/LiuLSNCP16,
  author       = {Liu, Chia{-}Wei and
                  Lowe, Ryan and
                  Serban, Iulian and
                  Noseworthy, Michael and
                  Charlin, Laurent and
                  Pineau, Joelle},
  editor       = {Su, Jian and
                  Carreras, Xavier and
                  Duh, Kevin},
  title        = {How {NOT} To Evaluate Your Dialogue System: An Empirical Study of
                  Unsupervised Evaluation Metrics for Dialogue Response Generation},
  booktitle    = {Proceedings of the 2016 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
                  2016},
  pages        = {2122--2132},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/d16-1230},
  doi          = {10.18653/V1/D16-1230},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LiuLSNCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/ZhouBP16,
  author       = {Zhou, Chenghui and
                  Balle, Borja and
                  Pineau, Joelle},
  editor       = {Kragic, Danica and
                  Bicchi, Antonio and
                  De Luca, Alessandro},
  title        = {Learning time series models for pedestrian motion prediction},
  booktitle    = {2016 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2016, Stockholm, Sweden, May 16-21, 2016},
  pages        = {3323--3330},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICRA.2016.7487506},
  doi          = {10.1109/ICRA.2016.7487506},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/ZhouBP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ijcai/WangP16,
  author       = {Wang, Boyu and
                  Pineau, Joelle},
  editor       = {Kambhampati, Subbarao},
  title        = {Generalized Dictionary for Multitask Learning with Boosting},
  booktitle    = {Proceedings of the Twenty-Fifth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July
                  2016},
  pages        = {2097--2103},
  publisher    = {{IJCAI/AAAI} Press},
  year         = {2016},
  url          = {http://www.ijcai.org/Abstract/16/299},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/WangP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/mlhc/ThodoroffPL16,
  author       = {Thodoroff, Pierre and
                  Pineau, Joelle and
                  Lim, Andrew},
  editor       = {Doshi{-}Velez, Finale and
                  Fackler, Jim and
                  Kale, David C. and
                  Wallace, Byron C. and
                  Wiens, Jenna},
  title        = {Learning Robust Features using Deep Learning for Automatic Seizure
                  Detection},
  booktitle    = {Proceedings of the 1st Machine Learning in Health Care, {MLHC} 2016,
                  Los Angeles, CA, USA, August 19-20, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {56},
  pages        = {178--190},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v56/Thodoroff16.html},
  timestamp    = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mlhc/ThodoroffPL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigdial/LoweSNCP16,
  author       = {Lowe, Ryan and
                  Serban, Iulian Vlad and
                  Noseworthy, Michael and
                  Charlin, Laurent and
                  Pineau, Joelle},
  title        = {On the Evaluation of Dialogue Systems with Next Utterance Classification},
  booktitle    = {Proceedings of the {SIGDIAL} 2016 Conference, The 17th Annual Meeting
                  of the Special Interest Group on Discourse and Dialogue, 13-15 September
                  2016, Los Angeles, CA, {USA}},
  pages        = {264--269},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/w16-3634},
  doi          = {10.18653/V1/W16-3634},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/LoweSNCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LiuLSNCP16,
  author       = {Liu, Chia{-}Wei and
                  Lowe, Ryan and
                  Serban, Iulian Vlad and
                  Noseworthy, Michael and
                  Charlin, Laurent and
                  Pineau, Joelle},
  title        = {How {NOT} To Evaluate Your Dialogue System: An Empirical Study of
                  Unsupervised Evaluation Metrics for Dialogue Response Generation},
  journal      = {CoRR},
  volume       = {abs/1603.08023},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.08023},
  eprinttype   = {arXiv},
  eprint       = {1603.08023},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiuLSNCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LoweSNCP16,
  author       = {Lowe, Ryan and
                  Serban, Iulian Vlad and
                  Noseworthy, Michael and
                  Charlin, Laurent and
                  Pineau, Joelle},
  title        = {On the Evaluation of Dialogue Systems with Next Utterance Classification},
  journal      = {CoRR},
  volume       = {abs/1605.05414},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.05414},
  eprinttype   = {arXiv},
  eprint       = {1605.05414},
  timestamp    = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LoweSNCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SerbanSLCPCB16,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Lowe, Ryan and
                  Charlin, Laurent and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating
                  Dialogues},
  journal      = {CoRR},
  volume       = {abs/1605.06069},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.06069},
  eprinttype   = {arXiv},
  eprint       = {1605.06069},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanSLCPCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/BahdanauBXGLPCB16,
  author       = {Bahdanau, Dzmitry and
                  Brakel, Philemon and
                  Xu, Kelvin and
                  Goyal, Anirudh and
                  Lowe, Ryan and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  journal      = {CoRR},
  volume       = {abs/1607.07086},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.07086},
  eprinttype   = {arXiv},
  eprint       = {1607.07086},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauBXGLPCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/ThodoroffPL16,
  author       = {Thodoroff, Pierre and
                  Pineau, Joelle and
                  Lim, Andrew},
  title        = {Learning Robust Features using Deep Learning for Automatic Seizure
                  Detection},
  journal      = {CoRR},
  volume       = {abs/1608.00220},
  year         = {2016},
  url          = {http://arxiv.org/abs/1608.00220},
  eprinttype   = {arXiv},
  eprint       = {1608.00220},
  timestamp    = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ThodoroffPL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/GhavamzadehMPT16,
  author       = {Ghavamzadeh, Mohammad and
                  Mannor, Shie and
                  Pineau, Joelle and
                  Tamar, Aviv},
  title        = {{Bayesian} Reinforcement Learning: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/1609.04436},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.04436},
  eprinttype   = {arXiv},
  eprint       = {1609.04436},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GhavamzadehMPT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SerbanLCP16,
  author       = {Serban, Iulian Vlad and
                  Lowe, Ryan and
                  Charlin, Laurent and
                  Pineau, Joelle},
  title        = {Generative Deep Neural Networks for Dialogue: {A} Short Review},
  journal      = {CoRR},
  volume       = {abs/1611.06216},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.06216},
  eprinttype   = {arXiv},
  eprint       = {1611.06216},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanLCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SerbanOPC16,
  author       = {Serban, Iulian Vlad and
                  Ororbia, II, Alexander G. and
                  Pineau, Joelle and
                  Courville, Aaron C.},
  title        = {Multi-modal Variational Encoder-Decoders},
  journal      = {CoRR},
  volume       = {abs/1612.00377},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.00377},
  eprinttype   = {arXiv},
  eprint       = {1612.00377},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanOPC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ftml/GhavamzadehMPT15,
  author       = {Ghavamzadeh, Mohammad and
                  Mannor, Shie and
                  Pineau, Joelle and
                  Tamar, Aviv},
  title        = {{Bayesian} Reinforcement Learning: {A} Survey},
  journal      = {Found. Trends Mach. Learn.},
  volume       = {8},
  number       = {5--6},
  pages        = {359--483},
  year         = {2015},
  url          = {https://doi.org/10.1561/2200000049},
  doi          = {10.1561/2200000049},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ftml/GhavamzadehMPT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WangP15,
  author       = {Wang, Boyu and
                  Pineau, Joelle},
  editor       = {Bonet, Blai and
                  Koenig, Sven},
  title        = {Online Boosting Algorithms for Anytime Transfer and Multitask Learning},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {3038--3044},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9607},
  doi          = {10.1609/AAAI.V29I1.9607},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WangP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/MaP15,
  author       = {Ma, Hang and
                  Pineau, Joelle},
  editor       = {Bonet, Blai and
                  Koenig, Sven},
  title        = {Information Gathering and Reward Exploitation of Subgoals for {POMDPs}},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {3320--3326},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9659},
  doi          = {10.1609/AAAI.V29I1.9659},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MaP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaifs/DurandP15,
  author       = {Durand, Audrey and
                  Pineau, Joelle},
  title        = {Adaptive Treatment Allocation Using Sub-Sampled {Gaussian} Processes},
  booktitle    = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14,
                  2015},
  pages        = {9--11},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11671},
  timestamp    = {Wed, 14 Nov 2018 16:20:12 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/DurandP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaifs/SutcliffeTP15,
  author       = {Sutcliffe, Andrew and
                  Tenenholtz, Neil A. and
                  Pineau, Joelle},
  title        = {Missteps in Robot Social Navigation},
  booktitle    = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14,
                  2015},
  pages        = {134--136},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11679},
  timestamp    = {Sun, 09 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaifs/SutcliffeTP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aips/Pineau15,
  author       = {Pineau, Joelle},
  editor       = {Brafman, Ronen I. and
                  Domshlak, Carmel and
                  Haslum, Patrik and
                  Zilberstein, Shlomo},
  title        = {Improving the Design and Discovery of Dynamic Treatment Strategies
                  Using Recent Results in Sequential Decision-Making},
  booktitle    = {Proceedings of the Twenty-Fifth International Conference on Automated
                  Planning and Scheduling, {ICAPS} 2015, Jerusalem, Israel, June 7-11,
                  2015},
  pages        = {373},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/ICAPS/ICAPS15/paper/view/10637},
  timestamp    = {Tue, 26 May 2015 21:03:02 +0200},
  biburl       = {https://dblp.org/rec/conf/aips/Pineau15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/PineauB15,
  author       = {Pineau, Joelle and
                  Bacon, Pierre{-}Luc},
  editor       = {Katakis, Ioannis and
                  Schnitzler, Fran{\c{c}}ois and
                  Liebig, Thomas and
                  Gunopulos, Dimitrios and
                  Morik, Katharina and
                  Andrienko, Gennady L. and
                  Mannor, Shie},
  title        = {Analyzing Open Data from the City of {Montreal}},
  booktitle    = {Proceedings of the 2nd International Workshop on Mining Urban Data
                  co-located with 32nd International Conference on Machine Learning
                  ({ICML} 2015), Lille, France, July 11th, 2015},
  series       = {{CEUR} Workshop Proceedings},
  volume       = {1392},
  pages        = {11--16},
  publisher    = {CEUR-WS.org},
  year         = {2015},
  url          = {https://ceur-ws.org/Vol-1392/paper-02.pdf},
  timestamp    = {Fri, 10 Mar 2023 16:22:13 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/PineauB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/LeighPOZ15,
  author       = {Leigh, Angus and
                  Pineau, Joelle and
                  Olmedo, Nicolas A. and
                  Zhang, Hong},
  title        = {Person tracking and following with {2D} laser scanners},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2015, Seattle, WA, USA, 26-30 May, 2015},
  pages        = {726--733},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICRA.2015.7139259},
  doi          = {10.1109/ICRA.2015.7139259},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/LeighPOZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ijcai/BarretoBPP15,
  author       = {Barreto, Andr{\'{e}} da Motta Salles and
                  Beirigo, Rafael L. and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Yang, Qiang and
                  Wooldridge, Michael J.},
  title        = {An Expectation-Maximization Algorithm to Compute a Stochastic Factorization
                  From Data},
  booktitle    = {Proceedings of the Twenty-Fourth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July
                  25-31, 2015},
  pages        = {3329--3336},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://ijcai.org/Abstract/15/469},
  timestamp    = {Tue, 20 Aug 2019 16:16:43 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/BarretoBPP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/YuenPA15,
  author       = {Yuen, HiuKim and
                  Pineau, Joelle and
                  Archambault, Philippe S.},
  title        = {Automatically characterizing driving activities onboard smart wheelchairs
                  from accelerometer data},
  booktitle    = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2015, Hamburg, Germany, September 28 - October 2,
                  2015},
  pages        = {5011--5018},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/IROS.2015.7354082},
  doi          = {10.1109/IROS.2015.7354082},
  timestamp    = {Fri, 26 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/YuenPA15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigdial/LowePSP15,
  author       = {Lowe, Ryan and
                  Pow, Nissan and
                  Serban, Iulian and
                  Pineau, Joelle},
  title        = {The {Ubuntu} Dialogue Corpus: {A} Large Dataset for Research in Unstructured
                  Multi-Turn Dialogue Systems},
  booktitle    = {Proceedings of the {SIGDIAL} 2015 Conference, The 16th Annual Meeting
                  of the Special Interest Group on Discourse and Dialogue, 2-4 September
                  2015, Prague, Czech Republic},
  pages        = {285--294},
  publisher    = {The Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.18653/v1/w15-4640},
  doi          = {10.18653/V1/W15-4640},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/LowePSP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LowePSP15,
  author       = {Lowe, Ryan and
                  Pow, Nissan and
                  Serban, Iulian and
                  Pineau, Joelle},
  title        = {The {Ubuntu} Dialogue Corpus: {A} Large Dataset for Research in Unstructured
                  Multi-Turn Dialogue Systems},
  journal      = {CoRR},
  volume       = {abs/1506.08909},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.08909},
  eprinttype   = {arXiv},
  eprint       = {1506.08909},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LowePSP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SerbanSBCP15,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  title        = {Hierarchical Neural Network Generative Models for Movie Dialogues},
  journal      = {CoRR},
  volume       = {abs/1507.04808},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.04808},
  eprinttype   = {arXiv},
  eprint       = {1507.04808},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanSBCP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/BengioBPP15,
  author       = {Bengio, Emmanuel and
                  Bacon, Pierre{-}Luc and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Conditional Computation in Neural Networks for faster models},
  journal      = {CoRR},
  volume       = {abs/1511.06297},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06297},
  eprinttype   = {arXiv},
  eprint       = {1511.06297},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BengioBPP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SerbanLCP15,
  author       = {Serban, Iulian Vlad and
                  Lowe, Ryan and
                  Henderson, Peter and
                  Charlin, Laurent and
                  Pineau, Joelle},
  title        = {A Survey of Available Corpora for Building Data-Driven Dialogue Systems},
  journal      = {CoRR},
  volume       = {abs/1512.05742},
  year         = {2015},
  url          = {http://arxiv.org/abs/1512.05742},
  eprinttype   = {arXiv},
  eprint       = {1512.05742},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanLCP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jair/BarretoPP14,
  author       = {Barreto, Andr{\'{e}} da Motta Salles and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Policy Iteration Based on Stochastic Factorization},
  journal      = {J. Artif. Intell. Res.},
  volume       = {50},
  pages        = {763--803},
  year         = {2014},
  url          = {https://doi.org/10.1613/jair.4301},
  doi          = {10.1613/JAIR.4301},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/BarretoPP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/HamiltonFP14,
  author       = {Hamilton, William L. and
                  Fard, Mahdi Milani and
                  Pineau, Joelle},
  title        = {Efficient learning and planning with compressed predictive states},
  journal      = {J. Mach. Learn. Res.},
  volume       = {15},
  number       = {1},
  pages        = {3395--3439},
  year         = {2014},
  url          = {https://dl.acm.org/doi/10.5555/2627435.2750354},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/HamiltonFP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaifs/SutcliffeGP14,
  author       = {Sutcliffe, Andrew and
                  Grollman, Daniel H. and
                  Pineau, Joelle},
  title        = {Estimating People's Subjective Experiences of Robot Behavior},
  booktitle    = {2014 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 13-15,
                  2014},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS14/paper/view/9148},
  timestamp    = {Wed, 14 Nov 2018 17:08:03 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/SutcliffeGP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/BalleHP14,
  author       = {Balle, Borja and
                  Hamilton, William L. and
                  Pineau, Joelle},
  title        = {Methods of Moments for Learning Stochastic Languages: Unified Presentation
                  and Empirical Comparison},
  booktitle    = {Proceedings of the 31st International Conference on Machine Learning,
                  {ICML} 2014, Beijing, China, 21-26 June 2014},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {32},
  pages        = {1386--1394},
  publisher    = {JMLR.org},
  year         = {2014},
  url          = {http://proceedings.mlr.press/v32/balle14.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BalleHP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/AlsharifP13,
  author       = {Alsharif, Ouais and
                  Pineau, Joelle},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {End-to-End Text Recognition with Hybrid {HMM} Maxout Models},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Workshop Track Proceedings},
  year         = {2014},
  eprinttype   = {arXiv},
  eprint       = {1310.1811},
  url          = {http://arxiv.org/abs/1310.1811},
  timestamp    = {Thu, 04 Apr 2019 13:20:06 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlsharifP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/RossPPC14,
  author       = {Ross, St{\'{e}}phane and
                  Pineau, Joelle and
                  Paquet, S{\'{e}}bastien and
                  Chaib{-}draa, Brahim},
  title        = {Online Planning Algorithms for {POMDPs}},
  journal      = {CoRR},
  volume       = {abs/1401.3436},
  year         = {2014},
  eprinttype   = {arXiv},
  eprint       = {1401.3436},
  url          = {http://arxiv.org/abs/1401.3436},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RossPPC14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/FardP14,
  author       = {Fard, Mahdi Milani and
                  Pineau, Joelle},
  title        = {Non-Deterministic Policies in {Markovian} Decision Processes},
  journal      = {CoRR},
  volume       = {abs/1401.3871},
  year         = {2014},
  eprinttype   = {arXiv},
  eprint       = {1401.3871},
  url          = {http://arxiv.org/abs/1401.3871},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/FardP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AlsharifBP14,
  author       = {Alsharif, Ouais and
                  Bachman, Philip and
                  Pineau, Joelle},
  title        = {Lifelong Learning of Discriminative Representations},
  journal      = {CoRR},
  volume       = {abs/1404.4108},
  year         = {2014},
  eprinttype   = {arXiv},
  eprint       = {1404.4108},
  url          = {http://arxiv.org/abs/1404.4108},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlsharifBP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BarretoPP14,
  author       = {da Motta Salles Barreto, Andr{\'{e}} and
                  Precup, Doina and
                  Pineau, Joelle},
  title        = {Practical Kernel-Based Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1407.5358},
  year         = {2014},
  eprinttype   = {arXiv},
  eprint       = {1407.5358},
  url          = {http://arxiv.org/abs/1407.5358},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BarretoPP14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/ShaniPK13,
  author       = {Shani, Guy and
                  Pineau, Joelle and
                  Kaplow, Robert},
  title        = {A survey of point-based {POMDP} solvers},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {27},
  number       = {1},
  pages        = {1--51},
  year         = {2013},
  doi          = {10.1007/S10458-012-9200-2},
  url          = {https://doi.org/10.1007/s10458-012-9200-2},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aamas/ShaniPK13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pami/FrankMPP13,
  author       = {Frank, Jordan and
                  Mannor, Shie and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Time Series Analysis Using Geometric Template Matching},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {35},
  number       = {3},
  pages        = {740--754},
  year         = {2013},
  doi          = {10.1109/TPAMI.2012.121},
  url          = {https://doi.org/10.1109/TPAMI.2012.121},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pami/FrankMPP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/OngGP13,
  author       = {Ong, Sylvie C. W. and
                  Grinberg, Yuri and
                  Pineau, Joelle},
  editor       = {desJardins, Marie and
                  Littman, Michael L.},
  title        = {Mixed Observability Predictive State Representations},
  booktitle    = {Proceedings of the Twenty-Seventh {AAAI} Conference on Artificial
                  Intelligence, July 14-18, 2013, Bellevue, Washington, {USA}},
  pages        = {746--752},
  publisher    = {{AAAI} Press},
  year         = {2013},
  doi          = {10.1609/AAAI.V27I1.8680},
  url          = {https://doi.org/10.1609/aaai.v27i1.8680},
  timestamp    = {Mon, 04 Sep 2023 15:56:33 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/OngGP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/Pineau13,
  author       = {Pineau, Joelle},
  title        = {Designing Intelligent Wheelchairs: Reintegrating {AI}},
  booktitle    = {Designing Intelligent Robots: Reintegrating {AI} II, Papers from the
                  2013 {AAAI} Spring Symposium, Palo Alto, California, USA, March 25-27,
                  2013},
  series       = {{AAAI} Technical Report},
  volume       = {{SS-13-04}},
  publisher    = {{AAAI}},
  year         = {2013},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS13/paper/view/5783},
  timestamp    = {Mon, 09 Sep 2013 15:13:13 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/Pineau13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/HamiltonFP13,
  author       = {Hamilton, William L. and
                  Fard, Mahdi Milani and
                  Pineau, Joelle},
  title        = {Modelling Sparse Dynamical Systems with Compressed Predictive State
                  Representations},
  booktitle    = {Proceedings of the 30th International Conference on Machine Learning,
                  {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {28},
  pages        = {178--186},
  publisher    = {JMLR.org},
  year         = {2013},
  url          = {http://proceedings.mlr.press/v28/hamilton13.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/HamiltonFP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/KimFPP13,
  author       = {Kim, Beomjoon and
                  Farahmand, Amir{-}massoud and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Burges, Christopher J. C. and
                  Bottou, L{\'{e}}on and
                  Ghahramani, Zoubin and
                  Weinberger, Kilian Q.},
  title        = {Learning from Limited Demonstrations},
  booktitle    = {Advances in Neural Information Processing Systems 26: 27th Annual
                  Conference on Neural Information Processing Systems 2013. Proceedings
                  of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages        = {2859--2867},
  year         = {2013},
  url          = {https://proceedings.neurips.cc/paper/2013/hash/fd5c905bcd8c3348ad1b35d7231ee2b1-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/KimFPP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/FardGFPP13,
  author       = {Fard, Mahdi Milani and
                  Grinberg, Yuri and
                  Farahmand, Amir{-}massoud and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Burges, Christopher J. C. and
                  Bottou, L{\'{e}}on and
                  Ghahramani, Zoubin and
                  Weinberger, Kilian Q.},
  title        = {Bellman Error Based Feature Generation using Random Projections on
                  Sparse Spaces},
  booktitle    = {Advances in Neural Information Processing Systems 26: 27th Annual
                  Conference on Neural Information Processing Systems 2013. Proceedings
                  of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages        = {3030--3038},
  year         = {2013},
  url          = {https://proceedings.neurips.cc/paper/2013/hash/86e8f7ab32cfd12577bc2619bc635690-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/FardGFPP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rss/KimP13,
  author       = {Kim, Beomjoon and
                  Pineau, Joelle},
  editor       = {Newman, Paul and
                  Fox, Dieter and
                  Hsu, David},
  title        = {Maximum Mean Discrepancy Imitation Learning},
  booktitle    = {Robotics: Science and Systems IX, Technische Universit{\"{a}}t
                  Berlin, Berlin, Germany, June 24 - June 28, 2013},
  year         = {2013},
  doi          = {10.15607/RSS.2013.IX.038},
  url          = {http://www.roboticsproceedings.org/rss09/p38.html},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/rss/KimP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WangP13,
  author       = {Wang, Boyu and
                  Pineau, Joelle},
  title        = {Online Ensemble Learning for Imbalanced Data Streams},
  journal      = {CoRR},
  volume       = {abs/1310.8004},
  year         = {2013},
  eprinttype   = {arXiv},
  eprint       = {1310.8004},
  url          = {http://arxiv.org/abs/1310.8004},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/WangP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HamiltonFP13,
  author       = {Hamilton, William L. and
                  Fard, Mahdi Milani and
                  Pineau, Joelle},
  title        = {Efficient Learning and Planning with Compressed Predictive States},
  journal      = {CoRR},
  volume       = {abs/1312.0286},
  year         = {2013},
  eprinttype   = {arXiv},
  eprint       = {1312.0286},
  url          = {http://arxiv.org/abs/1312.0286},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HamiltonFP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/Doshi-VelezPR12,
  author       = {Doshi{-}Velez, Finale and
                  Pineau, Joelle and
                  Roy, Nicholas},
  title        = {Reinforcement learning with limited reinforcement: Using {Bayes} risk
                  for active learning in {POMDPs}},
  journal      = {Artif. Intell.},
  volume       = {187},
  pages        = {115--132},
  year         = {2012},
  doi          = {10.1016/J.ARTINT.2012.04.006},
  url          = {https://doi.org/10.1016/j.artint.2012.04.006},
  timestamp    = {Sat, 27 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ai/Doshi-VelezPR12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jstsp/PngPC12,
  author       = {Png, ShaoWei and
                  Pineau, Joelle and
                  Chaib{-}draa, Brahim},
  title        = {Building Adaptive Dialogue Systems Via {Bayes}-Adaptive {POMDPs}},
  journal      = {{IEEE} J. Sel. Top. Signal Process.},
  volume       = {6},
  number       = {8},
  pages        = {917--927},
  year         = {2012},
  doi          = {10.1109/JSTSP.2012.2229962},
  url          = {https://doi.org/10.1109/JSTSP.2012.2229962},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jstsp/PngPC12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/FardGPP12,
  author       = {Fard, Mahdi Milani and
                  Grinberg, Yuri and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Hoffmann, J{\"{o}}rg and
                  Selman, Bart},
  title        = {Compressed Least-Squares Regression on Sparse Spaces},
  booktitle    = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2012, Toronto, Ontario, Canada},
  pages        = {1054--1060},
  publisher    = {{AAAI} Press},
  year         = {2012},
  doi          = {10.1609/AAAI.V26I1.8303},
  url          = {https://doi.org/10.1609/aaai.v26i1.8303},
  timestamp    = {Mon, 04 Sep 2023 15:56:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/FardGPP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/crv/TsangOP12,
  author       = {Tsang, Emily and
                  Ong, Sylvie C. W. and
                  Pineau, Joelle},
  title        = {Design and Evaluation of a Flexible Interface for Spatial Navigation},
  booktitle    = {Ninth Conference on Computer and Robot Vision, {CRV} 2012, Toronto,
                  Ontario, Canada, May 28-30, 2012},
  pages        = {353--360},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  doi          = {10.1109/CRV.2012.53},
  url          = {https://doi.org/10.1109/CRV.2012.53},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/crv/TsangOP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ewrl/PaduraruPPC12,
  author       = {Paduraru, Cosmin and
                  Precup, Doina and
                  Pineau, Joelle and
                  Comanici, Gheorghe},
  editor       = {Deisenroth, Marc Peter and
                  Szepesv{\'{a}}ri, Csaba and
                  Peters, Jan},
  title        = {An Empirical Analysis of Off-policy Learning in Discrete {MDPs}},
  booktitle    = {Proceedings of the Tenth European Workshop on Reinforcement Learning,
                  {EWRL} 2012, Edinburgh, Scotland, UK, June, 2012},
  series       = {{JMLR} Proceedings},
  volume       = {24},
  pages        = {89--102},
  publisher    = {JMLR.org},
  year         = {2012},
  url          = {http://proceedings.mlr.press/v24/paduraru12a.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/conf/ewrl/PaduraruPPC12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BarretoPP12,
  author       = {da Motta Salles Barreto, Andr{\'{e}} and
                  Precup, Doina and
                  Pineau, Joelle},
  editor       = {Bartlett, Peter L. and
                  Pereira, Fernando C. N. and
                  Burges, Christopher J. C. and
                  Bottou, L{\'{e}}on and
                  Weinberger, Kilian Q.},
  title        = {On-line Reinforcement Learning Using Incremental Kernel-Based Stochastic
                  Factorization},
  booktitle    = {Advances in Neural Information Processing Systems 25: 26th Annual
                  Conference on Neural Information Processing Systems 2012. Proceedings
                  of a meeting held December 3-6, 2012, Lake Tahoe, Nevada, United States},
  pages        = {1493--1501},
  year         = {2012},
  url          = {https://proceedings.neurips.cc/paper/2012/hash/1ecfb463472ec9115b10c292ef8bc986-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BarretoPP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1202-3714,
  author       = {Deng, Kun and
                  Pineau, Joelle and
                  Murphy, Susan A.},
  title        = {Active Learning for Developing Personalized Treatment},
  journal      = {CoRR},
  volume       = {abs/1202.3714},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1202.3714},
  url          = {http://arxiv.org/abs/1202.3714},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1202-3714.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1202-3717,
  author       = {Fard, Mahdi Milani and
                  Pineau, Joelle and
                  Szepesv{\'{a}}ri, Csaba},
  title        = {{PAC-Bayesian} Policy Evaluation for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1202.3717},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1202.3717},
  url          = {http://arxiv.org/abs/1202.3717},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1202-3717.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1206-3281,
  author       = {Ross, St{\'{e}}phane and
                  Pineau, Joelle},
  title        = {Model-Based {Bayesian} Reinforcement Learning in Large Structured Domains},
  journal      = {CoRR},
  volume       = {abs/1206.3281},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1206.3281},
  url          = {http://arxiv.org/abs/1206.3281},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1206-3281.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1207-4676,
  author       = {Langford, John and
                  Pineau, Joelle},
  title        = {Proceedings of the 29th International Conference on Machine Learning
                  {(ICML-12)}},
  journal      = {CoRR},
  volume       = {abs/1207.4676},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1207.4676},
  url          = {http://arxiv.org/abs/1207.4676},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1207-4676.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1207-5554,
  author       = {Fard, Mahdi Milani and
                  Grinberg, Yuri and
                  Farahmand, Amir{-}massoud and
                  Pineau, Joelle and
                  Precup, Doina},
  title        = {Bellman Error Based Feature Generation using Random Projections on
                  Sparse Spaces},
  journal      = {CoRR},
  volume       = {abs/1207.5554},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1207.5554},
  url          = {http://arxiv.org/abs/1207.5554},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1207-5554.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1212-2495,
  author       = {Pineau, Joelle and
                  Gordon, Geoffrey J. and
                  Thrun, Sebastian},
  title        = {Policy-contingent abstraction for robust robot control},
  journal      = {CoRR},
  volume       = {abs/1212.2495},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1212.2495},
  url          = {http://arxiv.org/abs/1212.2495},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1212-2495.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/FardP11,
  author       = {Fard, Mahdi Milani and
                  Pineau, Joelle},
  title        = {Non-Deterministic Policies in {Markovian} Decision Processes},
  journal      = {J. Artif. Intell. Res.},
  volume       = {40},
  pages        = {1--24},
  year         = {2011},
  doi          = {10.1613/JAIR.3175},
  url          = {https://doi.org/10.1613/jair.3175},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/FardP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/RossPCK11,
  author       = {Ross, St{\'{e}}phane and
                  Pineau, Joelle and
                  Chaib{-}draa, Brahim and
                  Kreitmann, Pierre},
  title        = {A {Bayesian} Approach for Learning and Planning in Partially Observable
                  {Markov} Decision Processes},
  journal      = {J. Mach. Learn. Res.},
  volume       = {12},
  pages        = {1729--1770},
  year         = {2011},
  doi          = {10.5555/1953048.2021055},
  url          = {https://dl.acm.org/doi/10.5555/1953048.2021055},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/RossPCK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/ShortreedLLSPM11,
  author       = {Shortreed, Susan M. and
                  Laber, Eric B. and
                  Lizotte, Daniel J. and
                  Stroup, T. Scott and
                  Pineau, Joelle and
                  Murphy, Susan A.},
  title        = {Informing sequential clinical decision-making through reinforcement
                  learning: an empirical study},
  journal      = {Mach. Learn.},
  volume       = {84},
  number       = {1-2},
  pages        = {109--136},
  year         = {2011},
  doi          = {10.1007/S10994-010-5229-0},
  url          = {https://doi.org/10.1007/s10994-010-5229-0},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ml/ShortreedLLSPM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/VincentCP11,
  author       = {Vincent, Robert D. and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  title        = {A bistable computational model of recurring epileptiform activity
                  as observed in rodent slice preparations},
  journal      = {Neural Networks},
  volume       = {24},
  number       = {6},
  pages        = {526--537},
  year         = {2011},
  doi          = {10.1016/J.NEUNET.2011.03.003},
  url          = {https://doi.org/10.1016/j.neunet.2011.03.003},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nn/VincentCP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/SaulnierP11,
  author       = {Saulnier, Guillaume and
                  Pineau, Joelle},
  title        = {Automatic Seizure Detection in an In-Vivo Model of Epilepsy},
  booktitle    = {Computational Physiology, Papers from the 2011 {AAAI} Spring Symposium,
                  Technical Report SS-11-04, Stanford, California, USA, March 21-23,
                  2011},
  publisher    = {{AAAI}},
  year         = {2011},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS11/paper/view/2468},
  timestamp    = {Mon, 13 Feb 2012 17:06:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/SaulnierP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/adprl/DengPM11,
  author       = {Deng, Kun and
                  Pineau, Joelle and
                  Murphy, Susan A.},
  title        = {Active learning for personalizing treatment},
  booktitle    = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement
                  Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages        = {32--39},
  publisher    = {{IEEE}},
  year         = {2011},
  doi          = {10.1109/ADPRL.2011.5967348},
  url          = {https://doi.org/10.1109/ADPRL.2011.5967348},
  timestamp    = {Wed, 16 Oct 2019 14:14:48 +0200},
  biburl       = {https://dblp.org/rec/conf/adprl/DengPM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/embc/MoghaddamPFARAP11,
  author       = {Moghaddam, Athena K. and
                  Pineau, Joelle and
                  Frank, Jordan and
                  Archambault, Philippe S. and
                  Routhier, Fran{\c{c}}ois and
                  Audet, Therese and
                  Polgar, Jan and
                  Michaud, Fran{\c{c}}ois and
                  Boissy, Patrick},
  title        = {Mobility profile and wheelchair driving skills of powered wheelchair
                  users: Sensor-based event recognition using a support vector machine
                  classifier},
  booktitle    = {33rd Annual International Conference of the {IEEE} Engineering in
                  Medicine and Biology Society, {EMBC} 2011, Boston, MA, USA, August
                  30 - Sept. 3, 2011},
  pages        = {7336--7339},
  publisher    = {{IEEE}},
  year         = {2011},
  doi          = {10.1109/IEMBS.2011.6091711},
  url          = {https://doi.org/10.1109/IEMBS.2011.6091711},
  timestamp    = {Fri, 26 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/embc/MoghaddamPFARAP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ewrl/OngGP11,
  author       = {Ong, Sylvie C. W. and
                  Grinberg, Yuri and
                  Pineau, Joelle},
  editor       = {Sanner, Scott and
                  Hutter, Marcus},
  title        = {Goal-Directed Online Learning of Predictive Models},
  booktitle    = {Recent Advances in Reinforcement Learning - 9th European Workshop,
                  {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7188},
  pages        = {18--29},
  publisher    = {Springer},
  year         = {2011},
  doi          = {10.1007/978-3-642-29946-9\_6},
  url          = {https://doi.org/10.1007/978-3-642-29946-9\_6},
  timestamp    = {Tue, 14 May 2019 10:00:48 +0200},
  biburl       = {https://dblp.org/rec/conf/ewrl/OngGP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ewrl/PaduraruPP11,
  author       = {Paduraru, Cosmin and
                  Precup, Doina and
                  Pineau, Joelle},
  editor       = {Sanner, Scott and
                  Hutter, Marcus},
  title        = {A Framework for Computing Bounds for the Return of a Policy},
  booktitle    = {Recent Advances in Reinforcement Learning - 9th European Workshop,
                  {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7188},
  pages        = {201--212},
  publisher    = {Springer},
  year         = {2011},
  doi          = {10.1007/978-3-642-29946-9\_21},
  url          = {https://doi.org/10.1007/978-3-642-29946-9\_21},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ewrl/PaduraruPP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PngP11,
  author       = {Png, ShaoWei and
                  Pineau, Joelle},
  title        = {Bayesian reinforcement learning for {POMDP}-based dialogue systems},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {2156--2159},
  publisher    = {{IEEE}},
  year         = {2011},
  doi          = {10.1109/ICASSP.2011.5946754},
  url          = {https://doi.org/10.1109/ICASSP.2011.5946754},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PngP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BarretoPP11,
  author       = {da Motta Salles Barreto, Andr{\'{e}} and
                  Precup, Doina and
                  Pineau, Joelle},
  editor       = {Shawe{-}Taylor, John and
                  Zemel, Richard S. and
                  Bartlett, Peter L. and
                  Pereira, Fernando C. N. and
                  Weinberger, Kilian Q.},
  title        = {Reinforcement Learning using Kernel-Based Stochastic Factorization},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {720--728},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/b534ba68236ba543ae44b22bd110a1d6-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BarretoPP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/tbillc/DinculescuHPPP11,
  author       = {Dinculescu, Monica and
                  Hundt, Christopher and
                  Panangaden, Prakash and
                  Pineau, Joelle and
                  Precup, Doina},
  editor       = {Bezhanishvili, Guram and
                  L{\"{o}}bner, Sebastian and
                  Marra, Vincenzo and
                  Richter, Frank},
  title        = {The Duality of State and Observation in Probabilistic Transition Systems},
  booktitle    = {Logic, Language, and Computation - 9th International Tbilisi Symposium
                  on Logic, Language, and Computation, TbiLLC 2011, Kutaisi, Georgia,
                  September 26-30, 2011, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7758},
  pages        = {206--230},
  publisher    = {Springer},
  year         = {2011},
  doi          = {10.1007/978-3-642-36976-6\_14},
  url          = {https://doi.org/10.1007/978-3-642-36976-6\_14},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/tbillc/DinculescuHPPP11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/DengPM11,
  author       = {Deng, Kun and
                  Pineau, Joelle and
                  Murphy, Susan A.},
  editor       = {Cozman, F{\'{a}}bio Gagliardi and
                  Pfeffer, Avi},
  title        = {Active Learning for Developing Personalized Treatment},
  booktitle    = {{UAI} 2011, Proceedings of the Twenty-Seventh Conference on Uncertainty
                  in Artificial Intelligence, Barcelona, Spain, July 14-17, 2011},
  pages        = {161--168},
  publisher    = {{AUAI} Press},
  year         = {2011},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=2196\&proceeding\_id=27},
  timestamp    = {Wed, 03 Feb 2021 11:09:03 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/DengPM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Fard, Pineau and Szepesvari, UAI 2011.
% The title acronym is braced so sentence-casing styles keep its capitals;
% the url query parameters are separated by plain (TeX-escaped) ampersands.
@inproceedings{DBLP:conf/uai/FardPS11,
  author       = {Mahdi Milani Fard and
                  Joelle Pineau and
                  Csaba Szepesv{\'{a}}ri},
  editor       = {F{\'{a}}bio Gagliardi Cozman and
                  Avi Pfeffer},
  title        = {{PAC-Bayesian} Policy Evaluation for Reinforcement Learning},
  booktitle    = {{UAI} 2011, Proceedings of the Twenty-Seventh Conference on Uncertainty
                  in Artificial Intelligence, Barcelona, Spain, July 14-17, 2011},
  pages        = {195--202},
  publisher    = {{AUAI} Press},
  year         = {2011},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=2218\&proceeding\_id=27},
  timestamp    = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/FardPS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau, Gordon and Thrun, arXiv 1110.0027 (CoRR, 2011).
% NOTE(review): same title and authors as the JAIR 2006 record in this file;
% presumably the arXiv posting of that article - confirm before citing both.
% The plural acronym in the title is braced so sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-1110-0027,
  author       = {Joelle Pineau and
                  Geoffrey J. Gordon and
                  Sebastian Thrun},
  title        = {Anytime Point-Based Approximations for Large {POMDPs}},
  journal      = {CoRR},
  volume       = {abs/1110.0027},
  year         = {2011},
  url          = {http://arxiv.org/abs/1110.0027},
  eprinttype   = {arXiv},
  eprint       = {1110.0027},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1110-0027.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bush and Pineau, AAAI Fall Symposium 2010 (Technical Report FS-10-06).
@inproceedings{DBLP:conf/aaaifs/BushP10,
  author       = {Keith Bush and
                  Joelle Pineau},
  title        = {Treating Epilepsy by Reinforcement Learning Via Manifold-Based Simulation},
  year         = {2010},
  booktitle    = {Manifold Learning and Its Applications, Papers from the 2010 {AAAI}
                  Fall Symposium, Arlington, Virginia, USA, November 11-13, 2010},
  series       = {{AAAI} Technical Report},
  volume       = {{FS-10-06}},
  publisher    = {{AAAI}},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS10/paper/view/2263},
  timestamp    = {Thu, 26 Sep 2013 15:55:57 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaifs/BushP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% West, Precup and Pineau, CIKM 2010.
@inproceedings{DBLP:conf/cikm/WestPP10,
  author       = {Robert West and
                  Doina Precup and
                  Joelle Pineau},
  title        = {Automatically suggesting topics for augmenting text documents},
  year         = {2010},
  editor       = {Jimmy X. Huang and
                  Nick Koudas and
                  Gareth J. F. Jones and
                  Xindong Wu and
                  Kevyn Collins{-}Thompson and
                  Aijun An},
  booktitle    = {Proceedings of the 19th {ACM} Conference on Information and Knowledge
                  Management, {CIKM} 2010, Toronto, Ontario, Canada, October 26-30,
                  2010},
  pages        = {929--938},
  publisher    = {{ACM}},
  doi          = {10.1145/1871437.1871556},
  url          = {https://doi.org/10.1145/1871437.1871556},
  timestamp    = {Wed, 03 Aug 2022 15:48:33 +0200},
  biburl       = {https://dblp.org/rec/conf/cikm/WestPP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Kaplow, Atrash and Pineau, ICRA 2010.
@inproceedings{DBLP:conf/icra/KaplowAP10,
  author       = {Robert Kaplow and
                  Amin Atrash and
                  Joelle Pineau},
  title        = {Variable resolution decomposition for robotic navigation under a {POMDP}
                  framework},
  year         = {2010},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages        = {369--376},
  publisher    = {{IEEE}},
  doi          = {10.1109/ROBOT.2010.5509188},
  url          = {https://doi.org/10.1109/ROBOT.2010.5509188},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/KaplowAP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Guez and Pineau, ICRA 2010.
@inproceedings{DBLP:conf/icra/GuezP10,
  author       = {Arthur Guez and
                  Joelle Pineau},
  title        = {Multi-tasking {SLAM}},
  year         = {2010},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages        = {377--384},
  publisher    = {{IEEE}},
  doi          = {10.1109/ROBOT.2010.5509969},
  url          = {https://doi.org/10.1109/ROBOT.2010.5509969},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/GuezP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Fard and Pineau, NIPS 2010.
% The title acronym is braced so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/nips/FardP10,
  author       = {Mahdi Milani Fard and
                  Joelle Pineau},
  editor       = {John D. Lafferty and
                  Christopher K. I. Williams and
                  John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Aron Culotta},
  title        = {{PAC-Bayesian} Model Selection for Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 23: 24th Annual
                  Conference on Neural Information Processing Systems 2010. Proceedings
                  of a meeting held 6-9 December 2010, Vancouver, British Columbia,
                  Canada},
  pages        = {1624--1632},
  publisher    = {Curran Associates, Inc.},
  year         = {2010},
  url          = {https://proceedings.neurips.cc/paper/2010/hash/66368270ffd51418ec58bd793f2d9b1b-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/FardP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau, West, Atrash, Villemure and Routhier, PerMIS 2010.
@inproceedings{DBLP:conf/permis/Pineau0AVR10,
  author       = {Joelle Pineau and
                  Robert West and
                  Amin Atrash and
                  Julien Villemure and
                  Fran{\c{c}}ois Routhier},
  title        = {Towards a standardized test for intelligent wheelchairs},
  year         = {2010},
  editor       = {Elena Messina and
                  Raj Madhavan},
  booktitle    = {Proceedings of the 10th Performance Metrics for Intelligent Systems
                  Workshop, PerMIS 2010, Baltimore, Maryland, USA, September 28-30,
                  2010},
  pages        = {169--174},
  publisher    = {{ACM}},
  doi          = {10.1145/2377576.2377607},
  url          = {https://doi.org/10.1145/2377576.2377607},
  timestamp    = {Wed, 04 Nov 2020 08:42:47 +0100},
  biburl       = {https://dblp.org/rec/conf/permis/Pineau0AVR10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bunescu et al. (37 authors), AI Magazine 30(1), 2009: AAAI 2008 workshop reports.
@article{DBLP:journals/aim/BunescuCCCCDDDFGGGHJJKKKLLMMMMPPRRSSSATWSWZ09,
  author       = {Razvan C. Bunescu and
                  Vitor R. Carvalho and
                  Jan Chomicki and
                  Vincent Conitzer and
                  Michael T. Cox and
                  Virginia Dignum and
                  Zachary Dodds and
                  Mark Dredze and
                  David Furcy and
                  Evgeniy Gabrilovich and
                  Mehmet H. G{\"{o}}ker and
                  Hans W. Guesgen and
                  Haym Hirsh and
                  Dietmar Jannach and
                  Ulrich Junker and
                  Wolfgang Ketter and
                  Alfred Kobsa and
                  Sven Koenig and
                  Tessa A. Lau and
                  Lundy Lewis and
                  Eric T. Matson and
                  Ted Metzler and
                  Rada Mihalcea and
                  Bamshad Mobasher and
                  Joelle Pineau and
                  Pascal Poupart and
                  Anita Raja and
                  Wheeler Ruml and
                  Norman M. Sadeh and
                  Guy Shani and
                  Daniel G. Shapiro and
                  Sarabjot Singh Anand and
                  Matthew E. Taylor and
                  Kiri Wagstaff and
                  Trey Smith and
                  William E. Walsh and
                  Rong Zhou},
  title        = {{AAAI} 2008 Workshop Reports},
  year         = {2009},
  journal      = {{AI} Mag.},
  volume       = {30},
  number       = {1},
  pages        = {108--118},
  doi          = {10.1609/AIMAG.V30I1.2196},
  url          = {https://doi.org/10.1609/aimag.v30i1.2196},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/BunescuCCCCDDDFGGGHJJKKKLLMMMMPPRRSSSATWSWZ09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau, Guez, Vincent, Panuccio and Avoli, Int. J. Neural Syst. 19(4), 2009.
@article{DBLP:journals/ijns/PineauGVPA09,
  author       = {Joelle Pineau and
                  Arthur Guez and
                  Robert D. Vincent and
                  Gabriella Panuccio and
                  Massimo Avoli},
  title        = {Treating Epilepsy via Adaptive Neurostimulation: a Reinforcement Learning
                  Approach},
  year         = {2009},
  journal      = {Int. J. Neural Syst.},
  volume       = {19},
  number       = {4},
  pages        = {227--240},
  doi          = {10.1142/S0129065709001987},
  url          = {https://doi.org/10.1142/S0129065709001987},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijns/PineauGVPA09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Atrash, Kaplow, Villemure, West, Yamani and Pineau, Int. J. Soc. Robotics 1(4), 2009.
@article{DBLP:journals/ijsr/AtrashKVWYP09,
  author       = {Amin Atrash and
                  Robert Kaplow and
                  Julien Villemure and
                  Robert West and
                  Hiba Yamani and
                  Joelle Pineau},
  title        = {Development and Validation of a Robust Speech Interface for Improved
                  Human-Robot Interaction},
  year         = {2009},
  journal      = {Int. J. Soc. Robotics},
  volume       = {1},
  number       = {4},
  pages        = {345--356},
  doi          = {10.1007/S12369-009-0032-4},
  url          = {https://doi.org/10.1007/s12369-009-0032-4},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijsr/AtrashKVWYP09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% West, Precup and Pineau, CIKM 2009.
% The proper noun in the title is capitalised and braced so no style lowercases it.
@inproceedings{DBLP:conf/cikm/WestPP09,
  author       = {Robert West and
                  Doina Precup and
                  Joelle Pineau},
  editor       = {David Wai{-}Lok Cheung and
                  Il{-}Yeol Song and
                  Wesley W. Chu and
                  Xiaohua Hu and
                  Jimmy Lin},
  title        = {Completing {Wikipedia}'s hyperlink structure through dimensionality
                  reduction},
  booktitle    = {Proceedings of the 18th {ACM} Conference on Information and Knowledge
                  Management, {CIKM} 2009, Hong Kong, China, November 2-6, 2009},
  pages        = {1097--1106},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1645953.1646093},
  doi          = {10.1145/1645953.1646093},
  timestamp    = {Fri, 27 Aug 2021 11:13:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cikm/WestPP09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% West, Pineau and Precup, IJCAI 2009. The record carries no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/WestPP09,
  author       = {Robert West and
                  Joelle Pineau and
                  Doina Precup},
  title        = {Wikispeedia: An Online Game for Inferring Semantic Distances between
                  Concepts},
  year         = {2009},
  editor       = {Craig Boutilier},
  booktitle    = {{IJCAI} 2009, Proceedings of the 21st International Joint Conference
                  on Artificial Intelligence, Pasadena, California, USA, July 11-17,
                  2009},
  pages        = {1598--1603},
  url          = {http://ijcai.org/Proceedings/09/Papers/267.pdf},
  timestamp    = {Tue, 20 Aug 2019 16:16:40 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/WestPP09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Atrash and Pineau, IUI 2009.
% The proper adjective in the title is capitalised and braced so no style lowercases it.
@inproceedings{DBLP:conf/iui/AtrashP09,
  author       = {Amin Atrash and
                  Joelle Pineau},
  editor       = {Cristina Conati and
                  Mathias Bauer and
                  Nuria Oliver and
                  Daniel S. Weld},
  title        = {A {Bayesian} reinforcement learning approach for customizing human-robot
                  interfaces},
  booktitle    = {Proceedings of the 14th International Conference on Intelligent User
                  Interfaces, {IUI} 2009, Sanibel Island, Florida, USA, February 8-11,
                  2009},
  pages        = {355--360},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1502650.1502700},
  doi          = {10.1145/1502650.1502700},
  timestamp    = {Tue, 06 Nov 2018 11:07:41 +0100},
  biburl       = {https://dblp.org/rec/conf/iui/AtrashP09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Bush and Pineau, NIPS 2009.
@inproceedings{DBLP:conf/nips/BushP09,
  author       = {Keith Bush and
                  Joelle Pineau},
  title        = {Manifold Embeddings for Model-Based Reinforcement Learning under Partial
                  Observability},
  year         = {2009},
  editor       = {Yoshua Bengio and
                  Dale Schuurmans and
                  John D. Lafferty and
                  Christopher K. I. Williams and
                  Aron Culotta},
  booktitle    = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  pages        = {189--197},
  publisher    = {Curran Associates, Inc.},
  url          = {https://proceedings.neurips.cc/paper/2009/hash/a2557a7b2e94197ff767970b67041697-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BushP09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ross, Pineau, Paquet and Chaib-draa, J. Artif. Intell. Res. 32, 2008.
% The plural acronym in the title is braced so sentence-casing styles keep it.
@article{DBLP:journals/jair/RossPPC08,
  author       = {St{\'{e}}phane Ross and
                  Joelle Pineau and
                  S{\'{e}}bastien Paquet and
                  Brahim Chaib{-}draa},
  title        = {Online Planning Algorithms for {POMDPs}},
  journal      = {J. Artif. Intell. Res.},
  volume       = {32},
  pages        = {663--704},
  year         = {2008},
  url          = {https://doi.org/10.1613/jair.2567},
  doi          = {10.1613/JAIR.2567},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/RossPPC08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Fard, Pineau and Sun, AAAI 2008.
@inproceedings{DBLP:conf/aaai/FardPS08,
  author       = {Mahdi Milani Fard and
                  Joelle Pineau and
                  Peng Sun},
  title        = {A Variance Analysis for {POMDP} Policy Evaluation},
  year         = {2008},
  editor       = {Dieter Fox and
                  Carla P. Gomes},
  booktitle    = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2008, Chicago, Illinois, USA, July 13-17, 2008},
  pages        = {1056--1061},
  publisher    = {{AAAI} Press},
  url          = {http://www.aaai.org/Library/AAAI/2008/aaai08-167.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/FardPS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Guez, Vincent, Avoli and Pineau, AAAI 2008 proceedings.
@inproceedings{DBLP:conf/aaai/GuezVAP08,
  author       = {Arthur Guez and
                  Robert D. Vincent and
                  Massimo Avoli and
                  Joelle Pineau},
  title        = {Adaptive Treatment of Epilepsy via Batch-mode Reinforcement Learning},
  year         = {2008},
  editor       = {Dieter Fox and
                  Carla P. Gomes},
  booktitle    = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2008, Chicago, Illinois, USA, July 13-17, 2008},
  pages        = {1671--1678},
  publisher    = {{AAAI} Press},
  url          = {http://www.aaai.org/Library/IAAI/2008/iaai08-008.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GuezVAP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Doshi, Pineau and Roy, ICML 2008.
% The proper noun and plural acronym in the title are braced so sentence-casing
% styles keep their capitals; the booktitle braces wrap only the acronym.
@inproceedings{DBLP:conf/icml/DoshiPR08,
  author       = {Finale Doshi and
                  Joelle Pineau and
                  Nicholas Roy},
  editor       = {William W. Cohen and
                  Andrew McCallum and
                  Sam T. Roweis},
  title        = {Reinforcement learning with limited reinforcement: using {Bayes} risk
                  for active learning in {POMDPs}},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fifth International Conference
                  ({ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {307},
  pages        = {256--263},
  publisher    = {{ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1145/1390156.1390189},
  doi          = {10.1145/1390156.1390189},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/DoshiPR08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ross, Chaib-draa and Pineau, ICRA 2008.
% The proper adjective and plural acronym in the title are braced so
% sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/icra/RossCP08,
  author       = {St{\'{e}}phane Ross and
                  Brahim Chaib{-}draa and
                  Joelle Pineau},
  title        = {{Bayesian} reinforcement learning in continuous {POMDPs} with application
                  to robot navigation},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {2845--2851},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543641},
  doi          = {10.1109/ROBOT.2008.4543641},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/RossCP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Doshi, Pineau and Roy, ISAIM 2008. The record carries no pages, publisher or doi.
% The proper noun and plural acronym in the title are braced so sentence-casing
% styles keep their capitals.
@inproceedings{DBLP:conf/isaim/DoshiPR08,
  author       = {Finale Doshi and
                  Joelle Pineau and
                  Nicholas Roy},
  title        = {Reinforcement Learning with Limited Reinforcement: Using {Bayes} Risk
                  for Active Learning in {POMDPs}},
  booktitle    = {International Symposium on Artificial Intelligence and Mathematics,
                  {ISAIM} 2008, Fort Lauderdale, Florida, USA, January 2-4, 2008},
  year         = {2008},
  url          = {http://isaim2008.unl.edu/PAPERS/TechnicalProgram/ISAIM2008\_0044\_849d5727b40e38c8777f196c57cb519e.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isaim/DoshiPR08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau, Ross and Chaib-draa, ISAIM 2008. The record carries no pages, publisher or doi.
% The proper noun and plural acronym in the title are braced so sentence-casing
% styles keep their capitals.
@inproceedings{DBLP:conf/isaim/PineauRC08,
  author       = {Joelle Pineau and
                  St{\'{e}}phane Ross and
                  Brahim Chaib{-}draa},
  title        = {{Bayes}-Adaptive {POMDPs}: {A} New Perspective on the Explore-Exploit
                  Tradeoff in Partially Observable Domains},
  booktitle    = {International Symposium on Artificial Intelligence and Mathematics,
                  {ISAIM} 2008, Fort Lauderdale, Florida, USA, January 2-4, 2008},
  year         = {2008},
  url          = {http://isaim2008.unl.edu/PAPERS/SS3-ActiveLearning/jpineau-isaim08.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isaim/PineauRC08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Fard and Pineau, NIPS 2008.
% The plural acronym in the title is braced so sentence-casing styles keep it.
@inproceedings{DBLP:conf/nips/FardP08,
  author       = {Mahdi Milani Fard and
                  Joelle Pineau},
  editor       = {Daphne Koller and
                  Dale Schuurmans and
                  Yoshua Bengio and
                  L{\'{e}}on Bottou},
  title        = {{MDPs} with Non-Deterministic Policies},
  booktitle    = {Advances in Neural Information Processing Systems 21, Proceedings
                  of the Twenty-Second Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  pages        = {1065--1072},
  publisher    = {Curran Associates, Inc.},
  year         = {2008},
  url          = {https://proceedings.neurips.cc/paper/2008/hash/0c74b7f78409a4022a2c4c5a5ca3ee19-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/FardP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ross and Pineau, UAI 2008.
% The proper adjective in the title is braced so sentence-casing styles keep it;
% the url query parameters are separated by plain (TeX-escaped) ampersands.
@inproceedings{DBLP:conf/uai/RossP08,
  author       = {St{\'{e}}phane Ross and
                  Joelle Pineau},
  editor       = {David A. McAllester and
                  Petri Myllym{\"{a}}ki},
  title        = {Model-Based {Bayesian} Reinforcement Learning in Large Structured Domains},
  booktitle    = {{UAI} 2008, Proceedings of the 24th Conference in Uncertainty in Artificial
                  Intelligence, Helsinki, Finland, July 9-12, 2008},
  pages        = {476--483},
  publisher    = {{AUAI} Press},
  year         = {2008},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=1967\&proceeding\_id=24},
  timestamp    = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/RossP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Jaulmes, Pineau and Precup, Rev. d'Intelligence Artif. 21(1), 2007 (French title).
% The proper noun in the title is braced so sentence-casing styles keep it.
% NOTE(review): pages end at 34 but the DOI suffix reads 9-33 - confirm the range.
% NOTE(review): a separator before "L'algorithme" looks missing - confirm the title.
@article{DBLP:journals/ria/JaulmesPP07,
  author       = {Robin Jaulmes and
                  Joelle Pineau and
                  Doina Precup},
  title        = {Apprentissage actif dans les processus d{\'{e}}cisionnels de
                  {Markov} partiellement observables L'algorithme {MEDUSA}},
  journal      = {Rev. d'Intelligence Artif.},
  volume       = {21},
  number       = {1},
  pages        = {9--34},
  year         = {2007},
  url          = {https://doi.org/10.3166/ria.21.9-33},
  doi          = {10.3166/RIA.21.9-33},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ria/JaulmesPP07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hundt, Panangaden, Pineau and Precup, AAAI Fall Symposium 2007 (Technical Report FS-07-03).
@inproceedings{DBLP:conf/aaaifs/HundtPPP07,
  author       = {Christopher Hundt and
                  Prakash Panangaden and
                  Joelle Pineau and
                  Doina Precup},
  title        = {Representing Systems with Hidden State},
  year         = {2007},
  editor       = {Clayton T. Morrison and
                  Tim Oates},
  booktitle    = {Computational Approaches to Representation Change during Learning
                  and Development, Papers from the 2007 {AAAI} Fall Symposium, Arlington,
                  Virginia, USA, November 9-11, 2007},
  series       = {{AAAI} Technical Report},
  volume       = {{FS-07-03}},
  pages        = {17--23},
  publisher    = {{AAAI} Press},
  url          = {https://www.aaai.org/Library/Symposia/Fall/2007/fs07-03-003.php},
  timestamp    = {Sun, 16 Oct 2022 14:19:55 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaifs/HundtPPP07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau and Atrash, AAAI Spring Symposium 2007 (Technical Report SS-07-07).
% The camel-case system name in the title is braced so sentence-casing styles
% keep its inner capital.
@inproceedings{DBLP:conf/aaaiss/PineauA07,
  author       = {Joelle Pineau and
                  Amin Atrash},
  title        = {{SmartWheeler}: {A} Robotic Wheelchair Test-Bed for Investigating New
                  Models of Human-Robot Interaction},
  booktitle    = {Multidisciplinary Collaboration for Socially Assistive Robotics, Papers
                  from the 2007 {AAAI} Spring Symposium, Technical Report SS-07-07,
                  Stanford, California, USA, March 26-28, 2007},
  pages        = {59--64},
  publisher    = {{AAAI}},
  year         = {2007},
  url          = {http://www.aaai.org/Library/Symposia/Spring/2007/ss07-07-014.php},
  timestamp    = {Fri, 17 Feb 2012 14:15:32 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/PineauA07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Vincent, Pineau, de Guzman and Avoli, Canadian AI 2007 (LNCS 4509).
@inproceedings{DBLP:conf/ai/VincentPGA07,
  author       = {Robert D. Vincent and
                  Joelle Pineau and
                  Philip de Guzman and
                  Massimo Avoli},
  title        = {Recurrent Boosting for Classification of Natural and Synthetic Time-Series
                  Data},
  year         = {2007},
  editor       = {Ziad Kobti and
                  Dan Wu},
  booktitle    = {Advances in Artificial Intelligence, 20th Conference of the Canadian
                  Society for Computational Studies of Intelligence, Canadian {AI} 2007,
                  Montreal, Canada, May 28-30, 2007, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4509},
  pages        = {192--203},
  publisher    = {Springer},
  doi          = {10.1007/978-3-540-72665-4\_17},
  url          = {https://doi.org/10.1007/978-3-540-72665-4\_17},
  timestamp    = {Thu, 28 Sep 2023 12:27:08 +0200},
  biburl       = {https://dblp.org/rec/conf/ai/VincentPGA07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Jaulmes, Pineau and Precup, ICRA 2007.
@inproceedings{DBLP:conf/icra/JaulmesPP07,
  author       = {Robin Jaulmes and
                  Joelle Pineau and
                  Doina Precup},
  title        = {A formal framework for robot learning and control under model uncertainty},
  year         = {2007},
  booktitle    = {2007 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2007, 10-14 April 2007, Roma, Italy},
  pages        = {2104--2110},
  publisher    = {{IEEE}},
  doi          = {10.1109/ROBOT.2007.363632},
  url          = {https://doi.org/10.1109/ROBOT.2007.363632},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/JaulmesPP07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ross, Chaib-draa and Pineau, NIPS 2007.
% The proper noun and plural acronym in the title are braced so sentence-casing
% styles keep their capitals.
@inproceedings{DBLP:conf/nips/RossCP07,
  author       = {St{\'{e}}phane Ross and
                  Brahim Chaib{-}draa and
                  Joelle Pineau},
  editor       = {John C. Platt and
                  Daphne Koller and
                  Yoram Singer and
                  Sam T. Roweis},
  title        = {{Bayes}-Adaptive {POMDPs}},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {1225--1232},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/3b3dbaf68507998acd6a5a5254ab2d76-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/RossCP07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ross, Pineau and Chaib-draa, NIPS 2007.
% The plural acronym in the title is braced so sentence-casing styles keep it.
@inproceedings{DBLP:conf/nips/RossPC07,
  author       = {St{\'{e}}phane Ross and
                  Joelle Pineau and
                  Brahim Chaib{-}draa},
  editor       = {John C. Platt and
                  Daphne Koller and
                  Yoram Singer and
                  Sam T. Roweis},
  title        = {Theoretical Analysis of Heuristic Search Methods for Online {POMDPs}},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {1233--1240},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/138bb0696595b338afbab333c555292a-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RossPC07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Pineau, Gordon and Thrun, J. Artif. Intell. Res. 27, 2006.
% The plural acronym in the title is braced so sentence-casing styles keep it.
@article{DBLP:journals/jair/PineauGT06,
  author       = {Joelle Pineau and
                  Geoffrey J. Gordon and
                  Sebastian Thrun},
  title        = {Anytime Point-Based Approximations for Large {POMDPs}},
  journal      = {J. Artif. Intell. Res.},
  volume       = {27},
  pages        = {335--380},
  year         = {2006},
  url          = {https://doi.org/10.1613/jair.2078},
  doi          = {10.1613/JAIR.2078},
  timestamp    = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/PineauGT06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Vlassis, Gordon and Pineau, Robotics Auton. Syst. 54(11), 2006.
@article{DBLP:journals/ras/VlassisGP06,
  author       = {Nikos Vlassis and
                  Geoffrey J. Gordon and
                  Joelle Pineau},
  title        = {Planning under uncertainty in robotics},
  year         = {2006},
  journal      = {Robotics Auton. Syst.},
  volume       = {54},
  number       = {11},
  pages        = {885--886},
  doi          = {10.1016/J.ROBOT.2006.06.001},
  url          = {https://doi.org/10.1016/j.robot.2006.06.001},
  timestamp    = {Tue, 12 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ras/VlassisGP06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hundt, Panangaden, Pineau and Precup, AAAI 2006 (Twenty-First National Conference).
@inproceedings{DBLP:conf/aaai/HundtPPP06,
  author       = {Christopher Hundt and
                  Prakash Panangaden and
                  Joelle Pineau and
                  Doina Precup},
  title        = {Representing Systems with Hidden State},
  year         = {2006},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {368--374},
  publisher    = {{AAAI} Press},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-059.php},
  timestamp    = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HundtPPP06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Burfoot, Pineau and Dudek, ICAPS 2006.
% The algorithm name at the start of the title is braced so sentence-casing
% styles keep its capitals.
@inproceedings{DBLP:conf/aips/BurfootPD06,
  author       = {Daniel Burfoot and
                  Joelle Pineau and
                  Gregory Dudek},
  editor       = {Derek Long and
                  Stephen F. Smith and
                  Daniel Borrajo and
                  Lee McCluskey},
  title        = {{RRT-Plan}: {A} Randomized Algorithm for {STRIPS} Planning},
  booktitle    = {Proceedings of the Sixteenth International Conference on Automated
                  Planning and Scheduling, {ICAPS} 2006, Cumbria, UK, June 6-10, 2006},
  pages        = {362--365},
  publisher    = {{AAAI}},
  year         = {2006},
  url          = {http://www.aaai.org/Library/ICAPS/2006/icaps06-041.php},
  timestamp    = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aips/BurfootPD06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gavalda, Keller, Pineau and Precup, ECML 2006 (LNCS 4212).
% The acronym and proper noun in the title are braced so sentence-casing styles
% keep their capitals.
@inproceedings{DBLP:conf/ecml/GavaldaKPP06,
  author       = {Ricard Gavald{\`{a}} and
                  Philipp W. Keller and
                  Joelle Pineau and
                  Doina Precup},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Tobias Scheffer and
                  Myra Spiliopoulou},
  title        = {{PAC}-Learning of {Markov} Models with Hidden State},
  booktitle    = {Machine Learning: {ECML} 2006, 17th European Conference on Machine
                  Learning, Berlin, Germany, September 18-22, 2006, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4212},
  pages        = {150--161},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11871842\_18},
  doi          = {10.1007/11871842\_18},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ecml/GavaldaKPP06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECML 2005 paper (Lecture Notes in Computer Science, volume 3720).
% The proper noun Markov is brace-protected in the title so that
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/ecml/JaulmesPP05,
  author       = {Robin Jaulmes and
                  Joelle Pineau and
                  Doina Precup},
  editor       = {Jo{\~{a}}o Gama and
                  Rui Camacho and
                  Pavel Brazdil and
                  Al{\'{\i}}pio Jorge and
                  Lu{\'{\i}}s Torgo},
  title        = {Active Learning in Partially Observable {Markov} Decision Processes},
  booktitle    = {Machine Learning: {ECML} 2005, 16th European Conference on Machine
                  Learning, Porto, Portugal, October 3-7, 2005, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3720},
  pages        = {601--608},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11564096\_59},
  doi          = {10.1007/11564096\_59},
  timestamp    = {Wed, 24 Mar 2021 17:12:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ecml/JaulmesPP05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ISRR 2005 paper (Springer Tracts in Advanced Robotics, volume 28).
% Author and editor names are written in the "Last, First" form.
@inproceedings{DBLP:conf/isrr/PineauG05,
  author       = {Pineau, Joelle and
                  Gordon, Geoffrey J.},
  editor       = {Thrun, Sebastian and
                  Brooks, Rodney A. and
                  Durrant{-}Whyte, Hugh F.},
  title        = {{POMDP} Planning for Robust Robot Control},
  booktitle    = {Robotics Research: Results of the 12th International Symposium, {ISRR}
                  2005, October 12-15, 2005, San Francisco, CA, {USA}},
  series       = {Springer Tracts in Advanced Robotics},
  volume       = {28},
  pages        = {69--82},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/978-3-540-48113-3\_7},
  doi          = {10.1007/978-3-540-48113-3\_7},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isrr/PineauG05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 42, issue 3-4, 2003.
% Author names are written in the "Last, First" form.
@article{DBLP:journals/ras/PineauMPRT03,
  author       = {Pineau, Joelle and
                  Montemerlo, Michael and
                  Pollack, Martha E. and
                  Roy, Nicholas and
                  Thrun, Sebastian},
  title        = {Towards robotic assistants in nursing homes: Challenges and results},
  journal      = {Robotics Auton. Syst.},
  volume       = {42},
  number       = {3-4},
  pages        = {271--281},
  year         = {2003},
  url          = {https://doi.org/10.1016/S0921-8890(02)00381-0},
  doi          = {10.1016/S0921-8890(02)00381-0},
  timestamp    = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ras/PineauMPRT03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2003 paper on point-based value iteration.
% The acronym at the end of the title is brace-protected so that
% sentence-casing styles do not lowercase it to "pomdps".
@inproceedings{DBLP:conf/ijcai/PineauGT03,
  author       = {Joelle Pineau and
                  Geoffrey J. Gordon and
                  Sebastian Thrun},
  editor       = {Georg Gottlob and
                  Toby Walsh},
  title        = {Point-based value iteration: An anytime algorithm for {POMDPs}},
  booktitle    = {IJCAI-03, Proceedings of the Eighteenth International Joint Conference
                  on Artificial Intelligence, Acapulco, Mexico, August 9-15, 2003},
  pages        = {1025--1032},
  publisher    = {Morgan Kaufmann},
  year         = {2003},
  url          = {http://ijcai.org/Proceedings/03/Papers/147.pdf},
  timestamp    = {Tue, 20 Aug 2019 16:18:41 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/PineauGT03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2003 paper (Advances in Neural Information Processing Systems 16).
% The acronym at the end of the title is brace-protected so that
% sentence-casing styles do not lowercase it to "pomdps".
@inproceedings{DBLP:conf/nips/PineauGT03,
  author       = {Joelle Pineau and
                  Geoffrey J. Gordon and
                  Sebastian Thrun},
  editor       = {Sebastian Thrun and
                  Lawrence K. Saul and
                  Bernhard Sch{\"{o}}lkopf},
  title        = {Applying Metric-Trees to Belief-Point {POMDPs}},
  booktitle    = {Advances in Neural Information Processing Systems 16 [Neural Information
                  Processing Systems, {NIPS} 2003, December 8-13, 2003, Vancouver and
                  Whistler, British Columbia, Canada]},
  pages        = {759--766},
  publisher    = {{MIT} Press},
  year         = {2003},
  url          = {https://proceedings.neurips.cc/paper/2003/hash/6547884cea64550284728eb26b0947ef-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PineauGT03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2003 paper on policy-contingent abstraction.
% The url query string uses plain (escaped) ampersands as separators; the
% previous value carried a leaked HTML numeric character reference for the
% ampersand after each one, which produced a wrong link.
@inproceedings{DBLP:conf/uai/PineauGT03,
  author       = {Joelle Pineau and
                  Geoffrey J. Gordon and
                  Sebastian Thrun},
  editor       = {Christopher Meek and
                  Uffe Kj{\ae}rulff},
  title        = {Policy-contingent abstraction for robust robot control},
  booktitle    = {{UAI} '03, Proceedings of the 19th Conference in Uncertainty in Artificial
                  Intelligence, Acapulco, Mexico, August 7-10 2003},
  pages        = {477--484},
  publisher    = {Morgan Kaufmann},
  year         = {2003},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=964\&proceeding\_id=19},
  timestamp    = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/uai/PineauGT03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI/IAAI 2002 paper (Edmonton, Alberta, Canada).
% Author and editor names are written in the "Last, First" form.
@inproceedings{DBLP:conf/aaai/MontemerloPRTV02,
  author       = {Montemerlo, Michael and
                  Pineau, Joelle and
                  Roy, Nicholas and
                  Thrun, Sebastian and
                  Verma, Vandi},
  editor       = {Dechter, Rina and
                  Kearns, Michael J. and
                  Sutton, Richard S.},
  title        = {Experiences with a Mobile Robotic Guide for the Elderly},
  booktitle    = {Proceedings of the Eighteenth National Conference on Artificial Intelligence
                  and Fourteenth Conference on Innovative Applications of Artificial
                  Intelligence, July 28 - August 1, 2002, Edmonton, Alberta, Canada},
  pages        = {587--592},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2002},
  url          = {http://www.aaai.org/Library/AAAI/2002/aaai02-088.php},
  timestamp    = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MontemerloPRTV02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AMIA 2002 Annual Symposium paper; the record carries no pages field.
% Author names are written in the "Last, First" form.
@inproceedings{DBLP:conf/amia/MatthewsEMPRRT02,
  author       = {Matthews, Judith T. and
                  Engberg, Sandra and
                  Montemerlo, Michael and
                  Pineau, Joelle and
                  Roy, Nicholas and
                  Rogers, Joan and
                  Thrun, Sebastian},
  title        = {Robotic Assistance During Ambulation by Older Adults},
  booktitle    = {{AMIA} 2002, American Medical Informatics Association Annual Symposium,
                  San Antonio, TX, USA, November 9-13, 2002},
  publisher    = {{AMIA}},
  year         = {2002},
  url          = {https://knowledge.amia.org/amia-55142-a2002a-1.610020/t-002-1.611916/f-001-1.611917/a-333-1.612245/a-334-1.612242},
  timestamp    = {Wed, 17 Apr 2024 11:48:33 +0200},
  biburl       = {https://dblp.org/rec/conf/amia/MatthewsEMPRRT02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2000 paper (38th Annual Meeting, Hong Kong).
% Author names are written in the "Last, First" form.
@inproceedings{DBLP:conf/acl/RoyPT00,
  author       = {Roy, Nicholas and
                  Pineau, Joelle and
                  Thrun, Sebastian},
  title        = {Spoken Dialogue Management Using Probabilistic Reasoning},
  booktitle    = {38th Annual Meeting of the Association for Computational Linguistics,
                  Hong Kong, China, October 1-8, 2000},
  pages        = {93--100},
  publisher    = {{ACL}},
  year         = {2000},
  url          = {https://aclanthology.org/P00-1013/},
  doi          = {10.3115/1075218.1075231},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RoyPT00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2000 paper (Istanbul, Turkey).
% Author names are written in the "Last, First" form.
@inproceedings{DBLP:conf/icassp/GoddeauP00,
  author       = {Goddeau, David and
                  Pineau, Joelle},
  title        = {Fast reinforcement learning of dialog strategies},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing.
                  {ICASSP} 2000, 5-9 June, 2000, Hilton Hotel and Convention Center,
                  Istanbul, Turkey},
  pages        = {1233--1236},
  publisher    = {{IEEE}},
  year         = {2000},
  url          = {https://doi.org/10.1109/ICASSP.2000.859189},
  doi          = {10.1109/ICASSP.2000.859189},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/GoddeauP00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}