% default search action
% BibTeX records: Joelle Pineau
@inproceedings{DBLP:conf/cslaw/0002HDP24,
  author     = {Peter Henderson and Jieru Hu and Mona T. Diab and Joelle Pineau},
  title      = {Rethinking Machine Learning Benchmarks in the Context of Professional Codes of Conduct},
  booktitle  = {Proceedings of the Symposium on Computer Science and Law, {CSLAW} 2024, Boston, MA, USA, March 12-13, 2024},
  pages      = {109--120},
  publisher  = {{ACM}},
  year       = {2024},
  url        = {https://doi.org/10.1145/3614407.3643708},
  doi        = {10.1145/3614407.3643708},
  timestamp  = {Mon, 15 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cslaw/0002HDP24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/WabarthaP24,
  author     = {Maxime Wabartha and Joelle Pineau},
  title      = {Piecewise Linear Parametrization of Policies: Towards Interpretable Deep Reinforcement Learning},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=hOMVq57Ce0},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WabarthaP24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same author list as DBLP:journals/corr/abs-2403-07918; that record's title lacks the "Position:" prefix.
@inproceedings{DBLP:conf/icml/KapoorBKLRCHBBB24,
  author     = {Sayash Kapoor and Rishi Bommasani and Kevin Klyman and Shayne Longpre and Ashwin Ramaswami and Peter Cihon and Aspen K. Hopkins and Kevin Bankston and Stella Biderman and Miranda Bogen and Rumman Chowdhury and Alex Engler and Peter Henderson and Yacine Jernite and Seth Lazar and Stefano Maffulli and Alondra Nelson and Joelle Pineau and Aviya Skowron and Dawn Song and Victor Storchan and Daniel Zhang and Daniel E. Ho and Percy Liang and Arvind Narayanan},
  title      = {Position: On the Societal Impact of Open Foundation Models},
  booktitle  = {Forty-first International Conference on Machine Learning, {ICML} 2024, Vienna, Austria, July 21-27, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=jRX6yCxFhx},
  timestamp  = {Mon, 02 Sep 2024 16:45:29 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/KapoorBKLRCHBBB24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same author list as DBLP:conf/icml/KapoorBKLRCHBBB24.
@article{DBLP:journals/corr/abs-2403-07918,
  author     = {Sayash Kapoor and Rishi Bommasani and Kevin Klyman and Shayne Longpre and Ashwin Ramaswami and Peter Cihon and Aspen K. Hopkins and Kevin Bankston and Stella Biderman and Miranda Bogen and Rumman Chowdhury and Alex Engler and Peter Henderson and Yacine Jernite and Seth Lazar and Stefano Maffulli and Alondra Nelson and Joelle Pineau and Aviya Skowron and Dawn Song and Victor Storchan and Daniel Zhang and Daniel E. Ho and Percy Liang and Arvind Narayanan},
  title      = {On the Societal Impact of Open Foundation Models},
  journal    = {CoRR},
  volume     = {abs/2403.07918},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.07918},
  doi        = {10.48550/ARXIV.2403.07918},
  eprinttype = {arXiv},
  eprint     = {2403.07918},
  timestamp  = {Thu, 29 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-07918.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2203-00097.
@article{DBLP:journals/eor/CousineauVMP23,
  author     = {Martin Cousineau and Vedat Verter and Susan A. Murphy and Joelle Pineau},
  title      = {Estimating causal effects with optimization-based methods: {A} review and empirical comparison},
  journal    = {Eur. J. Oper. Res.},
  volume     = {304},
  number     = {2},
  pages      = {367--380},
  year       = {2023},
  url        = {https://doi.org/10.1016/j.ejor.2022.01.046},
  doi        = {10.1016/J.EJOR.2022.01.046},
  timestamp  = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/eor/CousineauVMP23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Publisher correction; same authors and journal as DBLP:journals/natmi/SrikumarFAACCHJLOP22.
% Journal abbreviation uses "Mach." to match the other journal abbreviations in this file.
@article{DBLP:journals/natmi/SrikumarFAACCHJLOP23,
  author     = {Madhulika Srikumar and Rebecca Finlay and Grace Abuhamad and Carolyn Ashurst and Rosie Campbell and Emily Campbell{-}Ratcliffe and Hudson Hongo and Sara R. Jordan and Joseph Lindley and Aviv Ovadya and Joelle Pineau},
  title      = {Publisher Correction: Advancing ethics review practices in {AI} research},
  journal    = {Nat. Mach. Intell.},
  volume     = {5},
  number     = {1},
  pages      = {94},
  year       = {2023},
  url        = {https://doi.org/10.1038/s42256-023-00608-6},
  doi        = {10.1038/S42256-023-00608-6},
  timestamp  = {Fri, 19 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/natmi/SrikumarFAACCHJLOP23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2206-10658.
@article{DBLP:journals/tacl/SachanLYZPZ23,
  author     = {Devendra Singh Sachan and Mike Lewis and Dani Yogatama and Luke Zettlemoyer and Joelle Pineau and Manzil Zaheer},
  title      = {Questions Are All You Need to Train a Dense Passage Retriever},
  journal    = {Trans. Assoc. Comput. Linguistics},
  volume     = {11},
  pages      = {600--616},
  year       = {2023},
  url        = {https://doi.org/10.1162/tacl\_a\_00564},
  doi        = {10.1162/TACL\_A\_00564},
  timestamp  = {Wed, 19 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tacl/SachanLYZPZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tmlr/SatijaLPP23,
  author     = {Harsh Satija and Alessandro Lazaric and Matteo Pirotta and Joelle Pineau},
  title      = {Group Fairness in Reinforcement Learning},
  journal    = {Trans. Mach. Learn. Res.},
  volume     = {2023},
  year       = {2023},
  url        = {https://openreview.net/forum?id=JkIH4MeOc3},
  timestamp  = {Thu, 18 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tmlr/SatijaLPP23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aiedu/KochmarVBGSP22,
  author     = {Ekaterina Kochmar and Dung Do Vu and Robert Belfer and Varun Gupta and Iulian Vlad Serban and Joelle Pineau},
  title      = {Automated Data-Driven Generation of Personalized Pedagogical Interventions in Intelligent Tutoring Systems},
  journal    = {Int. J. Artif. Intell. Educ.},
  volume     = {32},
  number     = {2},
  pages      = {323--349},
  year       = {2022},
  url        = {https://doi.org/10.1007/s40593-021-00267-x},
  doi        = {10.1007/S40593-021-00267-X},
  timestamp  = {Mon, 08 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/aiedu/KochmarVBGSP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jair/MazoureDLMPPR22,
  author     = {Bogdan Mazoure and Thang Doan and Tianyu Li and Vladimir Makarenkov and Joelle Pineau and Doina Precup and Guillaume Rabusseau},
  title      = {Low-Rank Representation of Reinforcement Learning Policies},
  journal    = {J. Artif. Intell. Res.},
  volume     = {75},
  pages      = {597--636},
  year       = {2022},
  url        = {https://doi.org/10.1613/jair.1.13854},
  doi        = {10.1613/JAIR.1.13854},
  timestamp  = {Sat, 05 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/MazoureDLMPPR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% A publisher correction with the same authors is recorded as DBLP:journals/natmi/SrikumarFAACCHJLOP23.
% Journal abbreviation uses "Mach." to match the other journal abbreviations in this file.
@article{DBLP:journals/natmi/SrikumarFAACCHJLOP22,
  author     = {Madhulika Srikumar and Rebecca Finlay and Grace Abuhamad and Carolyn Ashurst and Rosie Campbell and Emily Campbell{-}Ratcliffe and Hudson Hongo and Sara R. Jordan and Joseph Lindley and Aviv Ovadya and Joelle Pineau},
  title      = {Advancing ethics review practices in {AI} research},
  journal    = {Nat. Mach. Intell.},
  volume     = {4},
  number     = {12},
  pages      = {1061--1064},
  year       = {2022},
  url        = {https://doi.org/10.1038/s42256-022-00585-2},
  doi        = {10.1038/S42256-022-00585-2},
  timestamp  = {Wed, 17 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/natmi/SrikumarFAACCHJLOP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2201-01836.
% booktitle: "Twelveth" corrected to "Twelfth"; comma added before "Virtual Event",
% matching the AAAI 2021 booktitle elsewhere in this file.
@inproceedings{DBLP:conf/aaai/GX-ChenCRP22,
  author     = {Anthony GX{-}Chen and Veronica Chelu and Blake A. Richards and Joelle Pineau},
  title      = {A Generalized Bootstrap Target for Value-Learning, Efficiently Combining Value and Feature Predictions},
  booktitle  = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI} 2022, Thirty-Fourth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2022, Virtual Event, February 22 - March 1, 2022},
  pages      = {6829--6837},
  publisher  = {{AAAI} Press},
  year       = {2022},
  url        = {https://doi.org/10.1609/aaai.v36i6.20639},
  doi        = {10.1609/AAAI.V36I6.20639},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/GX-ChenCRP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2204-07496.
@inproceedings{DBLP:conf/emnlp/SachanLJAYPZ22,
  author     = {Devendra Singh Sachan and Mike Lewis and Mandar Joshi and Armen Aghajanyan and Wen{-}tau Yih and Joelle Pineau and Luke Zettlemoyer},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {Improving Passage Retrieval with Zero-Shot Question Generation},
  booktitle  = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages      = {3781--3797},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.emnlp-main.249},
  doi        = {10.18653/V1/2022.EMNLP-MAIN.249},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/SachanLJAYPZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2210-12574.
@inproceedings{DBLP:conf/emnlp/SinhaKRPHW22,
  author     = {Koustuv Sinha and Amirhossein Kazemnejad and Siva Reddy and Joelle Pineau and Dieuwke Hupkes and Adina Williams},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {The Curious Case of Absolute Position Embeddings},
  booktitle  = {Findings of the Association for Computational Linguistics: {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages      = {4449--4472},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-emnlp.326},
  doi        = {10.18653/V1/2022.FINDINGS-EMNLP.326},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/SinhaKRPHW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/CacciaAATPB22,
  author     = {Lucas Caccia and Rahaf Aljundi and Nader Asadi and Tinne Tuytelaars and Joelle Pineau and Eugene Belilovsky},
  title      = {New Insights on Reducing Abrupt Representation Change in Online Continual Learning},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=N8MaByOzUfb},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CacciaAATPB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2202-07013.
@inproceedings{DBLP:conf/icml/XieSFP022,
  author     = {Annie Xie and Shagun Sodhani and Chelsea Finn and Joelle Pineau and Amy Zhang},
  editor     = {Kamalika Chaudhuri and Stefanie Jegelka and Le Song and Csaba Szepesv{\'{a}}ri and Gang Niu and Sivan Sabato},
  title      = {Robust Policy Learning over Multiple Uncertainty Sets},
  booktitle  = {International Conference on Machine Learning, {ICML} 2022, 17-23 July 2022, Baltimore, Maryland, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {24414--24429},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/xie22c.html},
  timestamp  = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/XieSFP022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces around MDPs keep the acronym's capitalisation under sentence-casing styles.
@inproceedings{DBLP:conf/l4dc/SodhaniMP022,
  author     = {Shagun Sodhani and Franziska Meier and Joelle Pineau and Amy Zhang},
  editor     = {Roya Firoozi and Negar Mehr and Esen Yel and Rika Antonova and Jeannette Bohg and Mac Schwager and Mykel J. Kochenderfer},
  title      = {Block Contextual {MDPs} for Continual Learning},
  booktitle  = {Learning for Dynamics and Control Conference, {L4DC} 2022, 23-24 June 2022, Stanford University, Stanford, CA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {168},
  pages      = {608--623},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v168/sodhani22a.html},
  timestamp  = {Fri, 20 May 2022 14:36:40 +0200},
  biburl     = {https://dblp.org/rec/conf/l4dc/SodhaniMP022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/aaai/GX-ChenCRP22.
@article{DBLP:journals/corr/abs-2201-01836,
  author     = {Anthony GX{-}Chen and Veronica Chelu and Blake A. Richards and Joelle Pineau},
  title      = {A Generalized Bootstrap Target for Value-Learning, Efficiently Combining Value and Feature Predictions},
  journal    = {CoRR},
  volume     = {abs/2201.01836},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.01836},
  eprinttype = {arXiv},
  eprint     = {2201.01836},
  timestamp  = {Mon, 10 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-01836.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/icml/XieSFP022.
@article{DBLP:journals/corr/abs-2202-07013,
  author     = {Annie Xie and Shagun Sodhani and Chelsea Finn and Joelle Pineau and Amy Zhang},
  title      = {Robust Policy Learning over Multiple Uncertainty Sets},
  journal    = {CoRR},
  volume     = {abs/2202.07013},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.07013},
  eprinttype = {arXiv},
  eprint     = {2202.07013},
  timestamp  = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-07013.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-09826,
  author     = {Thang Doan and Seyed{-}Iman Mirzadeh and Joelle Pineau and Mehrdad Farajtabar},
  title      = {Efficient Continual Learning Ensembles in Neural Network Subspaces},
  journal    = {CoRR},
  volume     = {abs/2202.09826},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.09826},
  eprinttype = {arXiv},
  eprint     = {2202.09826},
  timestamp  = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-09826.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:journals/eor/CousineauVMP23.
@article{DBLP:journals/corr/abs-2203-00097,
  author     = {Martin Cousineau and Vedat Verter and Susan A. Murphy and Joelle Pineau},
  title      = {Estimating causal effects with optimization-based methods: {A} review and empirical comparison},
  journal    = {CoRR},
  volume     = {abs/2203.00097},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.00097},
  doi        = {10.48550/ARXIV.2203.00097},
  eprinttype = {arXiv},
  eprint     = {2203.00097},
  timestamp  = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-00097.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/emnlp/SachanLJAYPZ22.
@article{DBLP:journals/corr/abs-2204-07496,
  author     = {Devendra Singh Sachan and Mike Lewis and Mandar Joshi and Armen Aghajanyan and Wen{-}tau Yih and Joelle Pineau and Luke Zettlemoyer},
  title      = {Improving Passage Retrieval with Zero-Shot Question Generation},
  journal    = {CoRR},
  volume     = {abs/2204.07496},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.07496},
  doi        = {10.48550/ARXIV.2204.07496},
  eprinttype = {arXiv},
  eprint     = {2204.07496},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-07496.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:journals/tacl/SachanLYZPZ23.
@article{DBLP:journals/corr/abs-2206-10658,
  author     = {Devendra Singh Sachan and Mike Lewis and Dani Yogatama and Luke Zettlemoyer and Joelle Pineau and Manzil Zaheer},
  title      = {Questions Are All You Need to Train a Dense Passage Retriever},
  journal    = {CoRR},
  volume     = {abs/2206.10658},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.10658},
  doi        = {10.48550/ARXIV.2206.10658},
  eprinttype = {arXiv},
  eprint     = {2206.10658},
  timestamp  = {Mon, 27 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-10658.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/emnlp/SinhaKRPHW22.
@article{DBLP:journals/corr/abs-2210-12574,
  author     = {Koustuv Sinha and Amirhossein Kazemnejad and Siva Reddy and Joelle Pineau and Dieuwke Hupkes and Adina Williams},
  title      = {The Curious Case of Absolute Position Embeddings},
  journal    = {CoRR},
  volume     = {abs/2210.12574},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.12574},
  doi        = {10.48550/ARXIV.2210.12574},
  eprinttype = {arXiv},
  eprint     = {2210.12574},
  timestamp  = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-12574.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: space inserted before the parenthetical; NeurIPS braced so sentence-casing
% styles do not lowercase it.
@article{DBLP:journals/jmlr/PineauVSLBdFL21,
  author     = {Joelle Pineau and Philippe Vincent{-}Lamarre and Koustuv Sinha and Vincent Larivi{\`{e}}re and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Hugo Larochelle},
  title      = {Improving Reproducibility in Machine Learning Research (A Report from the {NeurIPS} 2019 Reproducibility Program)},
  journal    = {J. Mach. Learn. Res.},
  volume     = {22},
  pages      = {164:1--164:20},
  year       = {2021},
  url        = {https://jmlr.org/papers/v22/20-303.html},
  timestamp  = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/PineauVSLBdFL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/Yarats0KAPF21,
  author     = {Denis Yarats and Amy Zhang and Ilya Kostrikov and Brandon Amos and Joelle Pineau and Rob Fergus},
  title      = {Improving Sample Efficiency in Model-Free Reinforcement Learning from Images},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {10674--10681},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i12.17276},
  doi        = {10.1609/AAAI.V35I12.17276},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/Yarats0KAPF21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors as the arXiv/CoRR record DBLP:journals/corr/abs-2101-00010 (title there is cased "Unnatural").
% Braces around UnNatural keep its internal capital under sentence-casing styles.
@inproceedings{DBLP:conf/acl/SinhaPPW20,
  author     = {Koustuv Sinha and Prasanna Parthasarathi and Joelle Pineau and Adina Williams},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {{UnNatural} Language Inference},
  booktitle  = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages      = {7329--7346},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.569},
  doi        = {10.18653/V1/2021.ACL-LONG.569},
  timestamp  = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/SinhaPPW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces around TDprop and Jacobi keep their capitalisation under sentence-casing styles.
@inproceedings{DBLP:conf/atal/Romoff0KBTBP21,
  author     = {Joshua Romoff and Peter Henderson and David Kanaa and Emmanuel Bengio and Ahmed Touati and Pierre{-}Luc Bacon and Joelle Pineau},
  editor     = {Frank Dignum and Alessio Lomuscio and Ulle Endriss and Ann Now{\'{e}}},
  title      = {{TDprop}: Does Adaptive Optimization With {Jacobi} Preconditioning Help Temporal Difference Learning?},
  booktitle  = {{AAMAS} '21: 20th International Conference on Autonomous Agents and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages      = {1082--1090},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p1082.pdf},
  doi        = {10.5555/3463952.3464078},
  timestamp  = {Wed, 20 Jul 2022 17:03:47 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/Romoff0KBTBP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2102-03419.
@inproceedings{DBLP:conf/eacl/JamborTPH21,
  author     = {Dora Jambor and Komal K. Teru and Joelle Pineau and William L. Hamilton},
  editor     = {Paola Merlo and J{\"{o}}rg Tiedemann and Reut Tsarfaty},
  title      = {Exploring the Limits of Few-Shot Link Prediction in Knowledge Graphs},
  booktitle  = {Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume, {EACL} 2021, Online, April 19 - 23, 2021},
  pages      = {2816--2822},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.eacl-main.245},
  doi        = {10.18653/V1/2021.EACL-MAIN.245},
  timestamp  = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eacl/JamborTPH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2104-06644.
@inproceedings{DBLP:conf/emnlp/SinhaJHPWK21,
  author     = {Koustuv Sinha and Robin Jia and Dieuwke Hupkes and Joelle Pineau and Adina Williams and Douwe Kiela},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {Masked Language Modeling and the Distributional Hypothesis: Order Word Matters Pre-training for Little},
  booktitle  = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages      = {2888--2913},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.230},
  doi        = {10.18653/V1/2021.EMNLP-MAIN.230},
  timestamp  = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/SinhaJHPWK21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% booktitle dates set to 7-11 November, matching the EMNLP 2021 main-proceedings
% entry in this file (same event and venue); the export had 16-20 November.
% NOTE(review): confirm against the ACL Anthology volume front matter.
@inproceedings{DBLP:conf/emnlp/ParthasarathiSP21,
  author     = {Prasanna Parthasarathi and Koustuv Sinha and Joelle Pineau and Adina Williams},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {Sometimes We Want Ungrammatical Translations},
  booktitle  = {Findings of the Association for Computational Linguistics: {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages      = {3205--3227},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.findings-emnlp.275},
  doi        = {10.18653/V1/2021.FINDINGS-EMNLP.275},
  timestamp  = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ParthasarathiSP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces around MDPs keep the acronym's capitalisation under sentence-casing styles.
@inproceedings{DBLP:conf/iclr/0001SKP21,
  author     = {Amy Zhang and Shagun Sodhani and Khimya Khetarpal and Joelle Pineau},
  title      = {Learning Robust State Abstractions for Hidden-Parameter Block {MDPs}},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=fmOOI2a3tQP},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/0001SKP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/JeonSBDNP21,
  author     = {Wonseok Jeon and Chen{-}Yang Su and Paul Barde and Thang Doan and Derek Nowrouzezahrai and Joelle Pineau},
  title      = {Regularized Inverse Reinforcement Learning},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=HgLO8yalfwc},
  timestamp  = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/JeonSBDNP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces around OptiDICE keep its mixed-case spelling under sentence-casing styles.
@inproceedings{DBLP:conf/icml/0004JLPK21,
  author     = {Jongmin Lee and Wonseok Jeon and Byung{-}Jun Lee and Joelle Pineau and Kee{-}Eung Kim},
  editor     = {Marina Meila and Tong Zhang},
  title      = {{OptiDICE}: Offline Policy Optimization via Stationary Distribution Correction Estimation},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {6120--6130},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/lee21f.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/0004JLPK21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as the arXiv/CoRR record DBLP:journals/corr/abs-2102-06177.
@inproceedings{DBLP:conf/icml/Sodhani0P21,
  author     = {Shagun Sodhani and Amy Zhang and Joelle Pineau},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Multi-Task Reinforcement Learning with Context-based Representations},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {9767--9779},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/sodhani21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/Sodhani0P21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: colon moved outside the SPIBB brace group so styles can see the subtitle
% boundary; Seldonian and MDPs braced to keep their capitalisation.
@inproceedings{DBLP:conf/nips/SatijaTPL21,
  author     = {Harsh Satija and Philip S. Thomas and Joelle Pineau and Romain Laroche},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Multi-Objective {SPIBB}: {Seldonian} Offline Policy Improvement with Safety Constraints in Finite {MDPs}},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {2004--2017},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/0f65caf0a7d00afd2b87c028e88fe931-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SatijaTPL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigdial/ParthasarathiAC21,
  author     = {Prasanna Parthasarathi and Mohamed A. Abdelsalam and Sarath Chandar and Joelle Pineau},
  editor     = {Haizhou Li and Gina{-}Anne Levow and Zhou Yu and Chitralekha Gupta and Berrak Sisman and Siqi Cai and David Vandyke and Nina Dethlefs and Yan Wu and Junyi Jessy Li},
  title      = {A Brief Study on the Effects of Training Generative Dialogue Models with a Semantic loss},
  booktitle  = {Proceedings of the 22nd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGdial 2021, Singapore and Online, July 29-31, 2021},
  pages      = {469--476},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.sigdial-1.49},
  doi        = {10.18653/V1/2021.SIGDIAL-1.49},
  timestamp  = {Thu, 15 Aug 2024 07:54:16 +0200},
  biburl     = {https://dblp.org/rec/conf/sigdial/ParthasarathiAC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: stray space before the closing question mark removed.
@inproceedings{DBLP:conf/sigdial/ParthasarathiPC21,
  author     = {Prasanna Parthasarathi and Joelle Pineau and Sarath Chandar},
  editor     = {Haizhou Li and Gina{-}Anne Levow and Zhou Yu and Chitralekha Gupta and Berrak Sisman and Siqi Cai and David Vandyke and Nina Dethlefs and Yan Wu and Junyi Jessy Li},
  title      = {Do Encoder Representations of Generative Dialogue Models have sufficient summary of the Information about the task?},
  booktitle  = {Proceedings of the 22nd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGdial 2021, Singapore and Online, July 29-31, 2021},
  pages      = {477--488},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.sigdial-1.50},
  doi        = {10.18653/V1/2021.SIGDIAL-1.50},
  timestamp  = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sigdial/ParthasarathiPC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Braces around SPeCiaL keep its mixed-case spelling under sentence-casing styles.
@inproceedings{DBLP:conf/wcssl/CacciaP21,
  author     = {Lucas Caccia and Joelle Pineau},
  editor     = {Fabio Cuzzolin and Kevin Cannons and Vincenzo Lomonaco},
  title      = {{SPeCiaL}: Self-supervised Pretraining for Continual Learning},
  booktitle  = {Continual Semi-Supervised Learning - First International Workshop, {CSSL} 2021, Virtual Event, August 19-20, 2021, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {13418},
  pages      = {91--103},
  publisher  = {Springer},
  year       = {2021},
  url        = {https://doi.org/10.1007/978-3-031-17587-9\_7},
  doi        = {10.1007/978-3-031-17587-9\_7},
  timestamp  = {Fri, 07 Oct 2022 15:35:11 +0200},
  biburl     = {https://dblp.org/rec/conf/wcssl/CacciaP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@incollection{DBLP:series/lncs/DelacroixPM21,
  author     = {Sylvie Delacroix and Joelle Pineau and Jessica Montgomery},
  editor     = {Bertrand Braunschweig and Malik Ghallab},
  title      = {Democratising the Digital Revolution: The Role of Data Governance},
  booktitle  = {Reflections on Artificial Intelligence for Humanity},
  series     = {Lecture Notes in Computer Science},
  volume     = {12600},
  pages      = {40--52},
  publisher  = {Springer},
  year       = {2021},
  url        = {https://doi.org/10.1007/978-3-030-69128-8\_3},
  doi        = {10.1007/978-3-030-69128-8\_3},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/series/lncs/DelacroixPM21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors as DBLP:conf/acl/SinhaPPW20 (title there is cased "UnNatural").
@article{DBLP:journals/corr/abs-2101-00010,
  author     = {Koustuv Sinha and Prasanna Parthasarathi and Joelle Pineau and Adina Williams},
  title      = {Unnatural Language Inference},
  journal    = {CoRR},
  volume     = {abs/2101.00010},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.00010},
  eprinttype = {arXiv},
  eprint     = {2101.00010},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-00010.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2101-04909,
  author     = {Anuroop Sriram and Matthew J. Muckley and Koustuv Sinha and Farah Shamout and Joelle Pineau and Krzysztof J. Geras and Lea Azour and Yindalon Aphinyanaphongs and Nafissa Yakubova and William Moore},
  title      = {{COVID-19} Prognosis via Self-Supervised Representation Learning and Multi-Image Prediction},
  journal    = {CoRR},
  volume     = {abs/2101.04909},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.04909},
  eprinttype = {arXiv},
  eprint     = {2101.04909},
  timestamp  = {Sat, 30 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-04909.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/eacl/JamborTPH21.
@article{DBLP:journals/corr/abs-2102-03419,
  author     = {Dora Jambor and Komal K. Teru and Joelle Pineau and William L. Hamilton},
  title      = {Exploring the Limits of Few-Shot Link Prediction in Knowledge Graphs},
  journal    = {CoRR},
  volume     = {abs/2102.03419},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.03419},
  eprinttype = {arXiv},
  eprint     = {2102.03419},
  timestamp  = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-03419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv/CoRR record; same authors and title as DBLP:conf/icml/Sodhani0P21.
@article{DBLP:journals/corr/abs-2102-06177,
  author     = {Shagun Sodhani and Amy Zhang and Joelle Pineau},
  title      = {Multi-Task Reinforcement Learning with Context-based Representations},
  journal    = {CoRR},
  volume     = {abs/2102.06177},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.06177},
  eprinttype = {arXiv},
  eprint     = {2102.06177},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-06177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2102-07097,
  author     = {Bonnie Li and Vincent Fran{\c{c}}ois{-}Lavet and Thang Doan and Joelle Pineau},
  title      = {Domain Adversarial Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2102.07097},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.07097},
  eprinttype = {arXiv},
  eprint     = {2102.07097},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-07097.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2102-09850,
  author     = {Manan Tomar and Amy Zhang and Roberto Calandra and Matthew E. Taylor and Joelle Pineau},
  title      = {Model-Invariant State Abstractions for Model-Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2102.09850},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.09850},
  eprinttype = {arXiv},
  eprint     = {2102.09850},
  timestamp  = {Wed, 24 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-09850.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-08067,
  author     = {Kalesha Bullard and Douwe Kiela and Joelle Pineau and Jakob N. Foerster},
  title      = {Quasi-Equivalence Discovery for Zero-Shot Emergent Communication},
  journal    = {CoRR},
  volume     = {abs/2103.08067},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.08067},
  eprinttype = {arXiv},
  eprint     = {2103.08067},
  timestamp  = {Tue, 23 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-08067.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-05025,
  author     = {Lucas Caccia and Rahaf Aljundi and Tinne Tuytelaars and Joelle Pineau and Eugene Belilovsky},
  title      = {Reducing Representation Drift in Online Continual Learning},
  journal    = {CoRR},
  volume     = {abs/2104.05025},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.05025},
  eprinttype = {arXiv},
  eprint     = {2104.05025},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-05025.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-06644,
  author     = {Koustuv Sinha and Robin Jia and Dieuwke Hupkes and Joelle Pineau and Adina Williams and Douwe Kiela},
  title      = {Masked Language Modeling and the Distributional Hypothesis: Order Word Matters Pre-training for Little},
  journal    = {CoRR},
  volume     = {abs/2104.06644},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.06644},
  eprinttype = {arXiv},
  eprint     = {2104.06644},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-06644.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-07623,
  author     = {Prasanna Parthasarathi and Koustuv Sinha and Joelle Pineau and Adina Williams},
  title      = {Sometimes We Want Translationese},
  journal    = {CoRR},
  volume     = {abs/2104.07623},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.07623},
  eprinttype = {arXiv},
  eprint     = {2104.07623},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-07623.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: SPIBB, Seldonian and MDPs are brace-protected so sentence-casing
% styles keep their capitals; the colon is outside the braces so the subtitle
% boundary stays visible to the style.
@article{DBLP:journals/corr/abs-2106-00099,
  author     = {Harsh Satija and Philip S. Thomas and Joelle Pineau and Romain Laroche},
  title      = {Multi-Objective {SPIBB}: {Seldonian} Offline Policy Improvement with Safety Constraints in Finite {MDPs}},
  journal    = {CoRR},
  volume     = {abs/2106.00099},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.00099},
  eprinttype = {arXiv},
  eprint     = {2106.00099},
  timestamp  = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-00099.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-03955,
  author     = {Emmanuel Bengio and Joelle Pineau and Doina Precup},
  title      = {Correcting Momentum in Temporal Difference Learning},
  journal    = {CoRR},
  volume     = {abs/2106.03955},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.03955},
  eprinttype = {arXiv},
  eprint     = {2106.03955},
  timestamp  = {Thu, 10 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-03955.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the mixed-case method name SPeCiaL is brace-protected so
% sentence-casing styles do not flatten it to "Special".
@article{DBLP:journals/corr/abs-2106-09065,
  author     = {Lucas Caccia and Joelle Pineau},
  title      = {{SPeCiaL}: Self-Supervised Pretraining for Continual Learning},
  journal    = {CoRR},
  volume     = {abs/2106.09065},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.09065},
  eprinttype = {arXiv},
  eprint     = {2106.09065},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-09065.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-10619,
  author     = {Prasanna Parthasarathi and Mohamed A. Abdelsalam and Joelle Pineau and Sarath Chandar},
  title      = {A Brief Study on the Effects of Training Generative Dialogue Models with a Semantic loss},
  journal    = {CoRR},
  volume     = {abs/2106.10619},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.10619},
  eprinttype = {arXiv},
  eprint     = {2106.10619},
  timestamp  = {Tue, 09 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-10619.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-10622,
  author     = {Prasanna Parthasarathi and Joelle Pineau and Sarath Chandar},
  title      = {Do Encoder Representations of Generative Dialogue Models Encode Sufficient Information about the Task ?},
  journal    = {CoRR},
  volume     = {abs/2106.10622},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.10622},
  eprinttype = {arXiv},
  eprint     = {2106.10622},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-10622.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the method name OptiDICE is brace-protected so sentence-casing
% styles do not flatten it to "Optidice".
@article{DBLP:journals/corr/abs-2106-10783,
  author     = {Jongmin Lee and Wonseok Jeon and Byung{-}Jun Lee and Joelle Pineau and Kee{-}Eung Kim},
  title      = {{OptiDICE}: Offline Policy Optimization via Stationary Distribution Correction Estimation},
  journal    = {CoRR},
  volume     = {abs/2106.10783},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.10783},
  eprinttype = {arXiv},
  eprint     = {2106.10783},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-10783.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the acronym MDPs is brace-protected so sentence-casing styles
% do not lowercase it.
@article{DBLP:journals/corr/abs-2110-06972,
  author     = {Shagun Sodhani and Franziska Meier and Joelle Pineau and Amy Zhang},
  title      = {Block Contextual {MDPs} for Continual Learning},
  journal    = {CoRR},
  volume     = {abs/2110.06972},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.06972},
  eprinttype = {arXiv},
  eprint     = {2110.06972},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-06972.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/SerbanSPPB20,
  author     = {Iulian Vlad Serban and Chinnadhurai Sankar and Michael Pieper and Joelle Pineau and Yoshua Bengio},
  title      = {The Bottleneck Simulator: {A} Model-Based Deep Reinforcement Learning Approach},
  journal    = {J. Artif. Intell. Res.},
  volume     = {69},
  pages      = {571--612},
  year       = {2020},
  url        = {https://doi.org/10.1613/jair.1.12463},
  doi        = {10.1613/JAIR.1.12463},
  timestamp  = {Fri, 06 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/SerbanSPPB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/natmi/Peiffer-SmadjaM20,
  author     = {Nathan Peiffer{-}Smadja and Redwan Maatoug and Fran{\c{c}}ois{-}Xavier Lescure and Eric D'ortenzio and Joelle Pineau and Jean{-}R{\'{e}}mi King},
  title      = {Machine Learning for {COVID-19} needs global collaboration and data-sharing},
  journal    = {Nat. Mach. Intell.},
  volume     = {2},
  number     = {6},
  pages      = {293--294},
  year       = {2020},
  url        = {https://doi.org/10.1038/s42256-020-0181-6},
  doi        = {10.1038/S42256-020-0181-6},
  timestamp  = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/natmi/Peiffer-SmadjaM20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/CrawfordP20,
  author     = {Eric Crawford and Joelle Pineau},
  title      = {Exploiting Spatial Invariance for Scalable Unsupervised Object Tracking},
  booktitle  = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI} 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA, February 7-12, 2020},
  pages      = {3684--3692},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://doi.org/10.1609/aaai.v34i04.5777},
  doi        = {10.1609/AAAI.V34I04.5777},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/CrawfordP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ZhangDP20,
  author     = {Qizhen Zhang and Audrey Durand and Joelle Pineau},
  title      = {Literature Mining for Incorporating Inductive Bias in Biomedical Prediction Tasks (Student Abstract)},
  booktitle  = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI} 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA, February 7-12, 2020},
  pages      = {13983--13984},
  publisher  = {{AAAI} Press},
  year       = {2020},
  url        = {https://doi.org/10.1609/aaai.v34i10.7264},
  doi        = {10.1609/AAAI.V34I10.7264},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ZhangDP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SinhaPWLHP20,
  author     = {Koustuv Sinha and Prasanna Parthasarathi and Jasmine Wang and Ryan Lowe and William L. Hamilton and Joelle Pineau},
  editor     = {Dan Jurafsky and Joyce Chai and Natalie Schluter and Joel R. Tetreault},
  title      = {Learning an Unreferenced Metric for Online Dialogue Evaluation},
  booktitle  = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages      = {2430--2441},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.acl-main.220},
  doi        = {10.18653/V1/2020.ACL-MAIN.220},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/SinhaPWLHP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aied/KochmarVBGSP20,
  author     = {Ekaterina Kochmar and Dung Do Vu and Robert Belfer and Varun Gupta and Iulian Vlad Serban and Joelle Pineau},
  editor     = {Ig Ibert Bittencourt and Mutlu Cukurova and Kasia Muldner and Rose Luckin and Eva Mill{\'{a}}n},
  title      = {Automated Personalized Feedback Improves Learning Gains in An Intelligent Tutoring System},
  booktitle  = {Artificial Intelligence in Education - 21st International Conference, {AIED} 2020, Ifrane, Morocco, July 6-10, 2020, Proceedings, Part {II}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12164},
  pages      = {140--146},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-52240-7\_26},
  doi        = {10.1007/978-3-030-52240-7\_26},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aied/KochmarVBGSP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aied/SerbanGKVBPCCB20,
  author     = {Iulian Vlad Serban and Varun Gupta and Ekaterina Kochmar and Dung Do Vu and Robert Belfer and Joelle Pineau and Aaron C. Courville and Laurent Charlin and Yoshua Bengio},
  editor     = {Ig Ibert Bittencourt and Mutlu Cukurova and Kasia Muldner and Rose Luckin and Eva Mill{\'{a}}n},
  title      = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for {STEM}},
  booktitle  = {Artificial Intelligence in Education - 21st International Conference, {AIED} 2020, Ifrane, Morocco, July 6-10, 2020, Proceedings, Part {II}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12164},
  pages      = {387--392},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-52240-7\_70},
  doi        = {10.1007/978-3-030-52240-7\_70},
  timestamp  = {Tue, 07 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aied/SerbanGKVBPCCB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/debs/Pineau20,
  author     = {Joelle Pineau},
  editor     = {Julien Gascon{-}Samson and Kaiwen Zhang and Khuzaima Daudjee and Bettina Kemme},
  title      = {Building reproducible, reusable, and robust machine learning software},
  booktitle  = {14th {ACM} International Conference on Distributed and Event-based Systems, {DEBS} 2020, Montreal, Quebec, Canada, July 13-17, 2020},
  pages      = {2},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3401025.3407941},
  doi        = {10.1145/3401025.3407941},
  timestamp  = {Wed, 20 Jul 2022 14:24:56 +0200},
  biburl     = {https://dblp.org/rec/conf/debs/Pineau20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the acronym GANs is brace-protected so sentence-casing styles
% do not lowercase it.
@inproceedings{DBLP:conf/iclr/CacciaCFLPC20,
  author     = {Massimo Caccia and Lucas Caccia and William Fedus and Hugo Larochelle and Joelle Pineau and Laurent Charlin},
  title      = {Language {GANs} Falling Short},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=BJgza6VtPB},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CacciaCFLPC20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Lowe0FKP20,
  author     = {Ryan Lowe and Abhinav Gupta and Jakob N. Foerster and Douwe Kiela and Joelle Pineau},
  title      = {On the interaction between supervision and self-play in emergent communication},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=rJxGLlBtwH},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/Lowe0FKP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/BengioPP20,
  author     = {Emmanuel Bengio and Joelle Pineau and Doina Precup},
  title      = {Interference and Generalization in Temporal Difference Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {767--777},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/bengio20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/BengioPP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/CacciaBCP20,
  author     = {Lucas Caccia and Eugene Belilovsky and Massimo Caccia and Joelle Pineau},
  title      = {Online Learned Continual Compression with Adaptive Quantization Modules},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {1240--1250},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/caccia20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/CacciaBCP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the proper noun Markov is brace-protected so sentence-casing
% styles do not lowercase it.
@inproceedings{DBLP:conf/icml/SatijaAP20,
  author     = {Harsh Satija and Philip Amortila and Joelle Pineau},
  title      = {Constrained {Markov} Decision Processes via Backward Value Functions},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {8502--8511},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/satija20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/SatijaAP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the acronym MDPs is brace-protected so sentence-casing styles
% do not lowercase it.
@inproceedings{DBLP:conf/icml/0001LSFKPGP20,
  author     = {Amy Zhang and Clare Lyle and Shagun Sodhani and Angelos Filos and Marta Kwiatkowska and Joelle Pineau and Yarin Gal and Doina Precup},
  title      = {Invariant Causal Prediction for Block {MDPs}},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {11214--11224},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/zhang20t.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/0001LSFKPGP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/WabarthaDFP20,
  author     = {Maxime Wabartha and Audrey Durand and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  editor     = {Christian Bessiere},
  title      = {Handling Black Swan Events in Deep Learning with Diversely Extrapolated Neural Networks},
  booktitle  = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI} 2020},
  pages      = {2140--2147},
  publisher  = {ijcai.org},
  year       = {2020},
  url        = {https://doi.org/10.24963/ijcai.2020/296},
  doi        = {10.24963/IJCAI.2020/296},
  timestamp  = {Mon, 20 Jul 2020 12:38:52 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/WabarthaDFP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/Francois-LavetR20,
  author     = {Vincent Fran{\c{c}}ois{-}Lavet and Guillaume Rabusseau and Joelle Pineau and Damien Ernst and Raphael Fonteneau},
  editor     = {Christian Bessiere},
  title      = {On Overfitting and Asymptotic Bias in Batch Reinforcement Learning with Partial Observability (Extended Abstract)},
  booktitle  = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI} 2020},
  pages      = {5055--5059},
  publisher  = {ijcai.org},
  year       = {2020},
  url        = {https://doi.org/10.24963/ijcai.2020/706},
  doi        = {10.24963/IJCAI.2020/706},
  timestamp  = {Wed, 15 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/Francois-LavetR20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the method name Plan2Vec is brace-protected so sentence-casing
% styles do not flatten it to "Plan2vec".
@inproceedings{DBLP:conf/l4dc/Yang0MPAC20,
  author     = {Ge Yang and Amy Zhang and Ari S. Morcos and Joelle Pineau and Pieter Abbeel and Roberto Calandra},
  editor     = {Alexandre M. Bayen and Ali Jadbabaie and George J. Pappas and Pablo A. Parrilo and Benjamin Recht and Claire J. Tomlin and Melanie N. Zeilinger},
  title      = {{Plan2Vec}: Unsupervised Representation Learning by Latent Plans},
  booktitle  = {Proceedings of the 2nd Annual Conference on Learning for Dynamics and Control, {L4DC} 2020, Online Event, Berkeley, CA, USA, 11-12 June 2020},
  series     = {Proceedings of Machine Learning Research},
  volume     = {120},
  pages      = {935--946},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v120/yang20b.html},
  timestamp  = {Fri, 07 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/l4dc/Yang0MPAC20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BardeRJPPN20,
  author     = {Paul Barde and Julien Roy and Wonseok Jeon and Joelle Pineau and Chris Pal and Derek Nowrouzezahrai},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/9161ab7a1b61012c4c303f10b4c16b2c-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/BardeRJPPN20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/TaoFP20,
  author     = {Ruo Yu Tao and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Novelty Search in Representational Space for Sample Efficient Exploration},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/5ca41a86596a5ed567d15af0be224952-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/TaoFP20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/Touati0PV20,
  author     = {Ahmed Touati and Amy Zhang and Joelle Pineau and Pascal Vincent},
  editor     = {Ryan P. Adams and Vibhav Gogate},
  title      = {Stable Policy Optimization via Off-Policy Divergence Regularization},
  booktitle  = {Proceedings of the Thirty-Sixth Conference on Uncertainty in Artificial Intelligence, {UAI} 2020, virtual online, August 3-6, 2020},
  series     = {Proceedings of Machine Learning Research},
  volume     = {124},
  pages      = {1328--1337},
  publisher  = {{AUAI} Press},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v124/touati20a.html},
  timestamp  = {Tue, 07 May 2024 20:09:01 +0200},
  biburl     = {https://dblp.org/rec/conf/uai/Touati0PV20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-01093,
  author     = {Ryan Lowe and Abhinav Gupta and Jakob N. Foerster and Douwe Kiela and Joelle Pineau},
  title      = {On the interaction between supervision and self-play in emergent communication},
  journal    = {CoRR},
  volume     = {abs/2002.01093},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.01093},
  eprinttype = {arXiv},
  eprint     = {2002.01093},
  timestamp  = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-01093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02863,
  author     = {Bogdan Mazoure and Thang Doan and Tianyu Li and Vladimir Makarenkov and Joelle Pineau and Doina Precup and Guillaume Rabusseau},
  title      = {Provably efficient reconstruction of policy networks},
  journal    = {CoRR},
  volume     = {abs/2002.02863},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.02863},
  eprinttype = {arXiv},
  eprint     = {2002.02863},
  timestamp  = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-02863.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-05651,
  author     = {Peter Henderson and Jieru Hu and Joshua Romoff and Emma Brunskill and Dan Jurafsky and Joelle Pineau},
  title      = {Towards the Systematic Reporting of the Energy and Carbon Footprints of Machine Learning},
  journal    = {CoRR},
  volume     = {abs/2002.05651},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.05651},
  eprinttype = {arXiv},
  eprint     = {2002.05651},
  timestamp  = {Fri, 14 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-05651.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-10525,
  author     = {Wonseok Jeon and Paul Barde and Derek Nowrouzezahrai and Joelle Pineau},
  title      = {Scalable Multi-Agent Inverse Reinforcement Learning via Actor-Attention-Critic},
  journal    = {CoRR},
  volume     = {abs/2002.10525},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.10525},
  eprinttype = {arXiv},
  eprint     = {2002.10525},
  timestamp  = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-10525.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-04108,
  author     = {Ahmed Touati and Amy Zhang and Joelle Pineau and Pascal Vincent},
  title      = {Stable Policy Optimization via Off-Policy Divergence Regularization},
  journal    = {CoRR},
  volume     = {abs/2003.04108},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.04108},
  eprinttype = {arXiv},
  eprint     = {2003.04108},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-04108.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the acronym MDPs is brace-protected so sentence-casing styles
% do not lowercase it.
@article{DBLP:journals/corr/abs-2003-06016,
  author     = {Amy Zhang and Clare Lyle and Shagun Sodhani and Angelos Filos and Marta Kwiatkowska and Joelle Pineau and Yarin Gal and Doina Precup},
  title      = {Invariant Causal Prediction for Block {MDPs}},
  journal    = {CoRR},
  volume     = {abs/2003.06016},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.06016},
  eprinttype = {arXiv},
  eprint     = {2003.06016},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-06016.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06350,
  author     = {Emmanuel Bengio and Joelle Pineau and Doina Precup},
  title      = {Interference and Generalization in Temporal Difference Learning},
  journal    = {CoRR},
  volume     = {abs/2003.06350},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.06350},
  eprinttype = {arXiv},
  eprint     = {2003.06350},
  timestamp  = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-06350.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06560,
  author     = {Koustuv Sinha and Shagun Sodhani and Joelle Pineau and William L. Hamilton},
  title      = {Evaluating Logical Generalization in Graph Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2003.06560},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.06560},
  eprinttype = {arXiv},
  eprint     = {2003.06560},
  timestamp  = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-06560.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the conference name NeurIPS is brace-protected so
% sentence-casing styles do not flatten it to "neurips".
@article{DBLP:journals/corr/abs-2003-12206,
  author     = {Joelle Pineau and Philippe Vincent{-}Lamarre and Koustuv Sinha and Vincent Larivi{\`{e}}re and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Hugo Larochelle},
  title      = {Improving Reproducibility in Machine Learning Research {(A} Report from the {NeurIPS} 2019 Reproducibility Program)},
  journal    = {CoRR},
  volume     = {abs/2003.12206},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.12206},
  eprinttype = {arXiv},
  eprint     = {2003.12206},
  timestamp  = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-12206.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-00583,
  author     = {Koustuv Sinha and Prasanna Parthasarathi and Jasmine Wang and Ryan Lowe and William L. Hamilton and Joelle Pineau},
  title      = {Learning an Unreferenced Metric for Online Dialogue Evaluation},
  journal    = {CoRR},
  volume     = {abs/2005.00583},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.00583},
  eprinttype = {arXiv},
  eprint     = {2005.00583},
  timestamp  = {Fri, 08 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-00583.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-02431,
  author     = {Ekaterina Kochmar and Dung Do Vu and Robert Belfer and Varun Gupta and Iulian Vlad Serban and Joelle Pineau},
  title      = {Automated Personalized Feedback Improves Learning Gains in an Intelligent Tutoring System},
  journal    = {CoRR},
  volume     = {abs/2005.02431},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.02431},
  eprinttype = {arXiv},
  eprint     = {2005.02431},
  timestamp  = {Sat, 09 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-02431.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the method name Plan2Vec is brace-protected so sentence-casing
% styles do not flatten it to "Plan2vec".
@article{DBLP:journals/corr/abs-2005-03648,
  author     = {Ge Yang and Amy Zhang and Ari S. Morcos and Joelle Pineau and Pieter Abbeel and Roberto Calandra},
  title      = {{Plan2Vec}: Unsupervised Representation Learning by Latent Plans},
  journal    = {CoRR},
  volume     = {abs/2005.03648},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.03648},
  eprinttype = {arXiv},
  eprint     = {2005.03648},
  timestamp  = {Fri, 07 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-03648.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-06616,
  author     = {Iulian Vlad Serban and Varun Gupta and Ekaterina Kochmar and Dung Do Vu and Robert Belfer and Joelle Pineau and Aaron C. Courville and Laurent Charlin and Yoshua Bengio},
  title      = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for {STEM}},
  journal    = {CoRR},
  volume     = {abs/2005.06616},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.06616},
  eprinttype = {arXiv},
  eprint     = {2005.06616},
  timestamp  = {Fri, 22 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-06616.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-13258,
  author     = {Paul Barde and Julien Roy and Wonseok Jeon and Joelle Pineau and Christopher J. Pal and Derek Nowrouzezahrai},
  title      = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization},
  journal    = {CoRR},
  volume     = {abs/2006.13258},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.13258},
  eprinttype = {arXiv},
  eprint     = {2006.13258},
  timestamp  = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-13258.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-01516,
  author     = {Deepak Sharma and Audrey Durand and Marc{-}Andr{\'{e}} Legault and Louis{-}Philippe Lemieux Perreault and Audrey Lema{\c{c}}on and Marie{-}Pierre Dub{\'{e}} and Joelle Pineau},
  title      = {Deep interpretability for {GWAS}},
  journal    = {CoRR},
  volume     = {abs/2007.01516},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.01516},
  eprinttype = {arXiv},
  eprint     = {2007.01516},
  timestamp  = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-01516.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the method name TDprop and the proper noun Jacobi are
% brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-2007-02786,
  author     = {Joshua Romoff and Peter Henderson and David Kanaa and Emmanuel Bengio and Ahmed Touati and Pierre{-}Luc Bacon and Joelle Pineau},
  title      = {{TDprop}: Does {Jacobi} Preconditioning Help Temporal Difference Learning?},
  journal    = {CoRR},
  volume     = {abs/2007.02786},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.02786},
  eprinttype = {arXiv},
  eprint     = {2007.02786},
  timestamp  = {Sat, 18 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-02786.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-07206,
  author     = {Amy Zhang and Shagun Sodhani and Khimya Khetarpal and Joelle Pineau},
  title      = {Multi-Task Reinforcement Learning as a Hidden-Parameter Block {MDP}},
  journal    = {CoRR},
  volume     = {abs/2007.07206},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.07206},
  eprinttype = {arXiv},
  eprint     = {2007.07206},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-07206.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-10427,
  author     = {Prasanna Parthasarathi and Joelle Pineau and Sarath Chandar},
  title      = {How To Evaluate Your Dialogue System: Probe Tasks as an Alternative for Token-level Evaluation Metrics},
  journal    = {CoRR},
  volume     = {abs/2008.10427},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.10427},
  eprinttype = {arXiv},
  eprint     = {2008.10427},
  timestamp  = {Fri, 28 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-10427.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title casing: the proper noun Markov is brace-protected so sentence-casing
% styles do not lowercase it.
@article{DBLP:journals/corr/abs-2008-11811,
  author     = {Harsh Satija and Philip Amortila and Joelle Pineau},
  title      = {Constrained {Markov} Decision Processes via Backward Value Functions},
  journal    = {CoRR},
  volume     = {abs/2008.11811},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.11811},
  eprinttype = {arXiv},
  eprint     = {2008.11811},
  timestamp  = {Tue, 15 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-11811.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.13579 (CoRR, 2020).
@article{DBLP:journals/corr/abs-2009-13579,
  author = {Ruo Yu Tao and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  title = {Novelty Search in representational space for sample efficient exploration},
  journal = {CoRR},
  volume = {abs/2009.13579},
  year = {2020},
  url = {https://arxiv.org/abs/2009.13579},
  eprinttype = {arXiv},
  eprint = {2009.13579},
  timestamp = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2009-13579.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.03691 (CoRR, 2020).
@article{DBLP:journals/corr/abs-2010-03691,
  author = {Wonseok Jeon and Chen{-}Yang Su and Paul Barde and Thang Doan and Derek Nowrouzezahrai and Joelle Pineau},
  title = {Regularized Inverse Reinforcement Learning},
  journal = {CoRR},
  volume = {abs/2010.03691},
  year = {2020},
  url = {https://arxiv.org/abs/2010.03691},
  eprinttype = {arXiv},
  eprint = {2010.03691},
  timestamp = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2010-03691.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.15896 (CoRR, 2020).
@article{DBLP:journals/corr/abs-2010-15896,
  author = {Kalesha Bullard and Franziska Meier and Douwe Kiela and Joelle Pineau and Jakob N. Foerster},
  title = {Exploring Zero-Shot Emergent Communication in Embodied Multi-Agent Populations},
  journal = {CoRR},
  volume = {abs/2010.15896},
  year = {2020},
  url = {https://arxiv.org/abs/2010.15896},
  eprinttype = {arXiv},
  eprint = {2010.15896},
  timestamp = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2010-15896.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2012.02055 (CoRR, 2020). The mixed-case term in the title is
% braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2012-02055,
  author = {Melissa Mozifian and Amy Zhang and Joelle Pineau and David Meger},
  title = {Intervention Design for Effective {Sim2Real} Transfer},
  journal = {CoRR},
  volume = {abs/2012.02055},
  year = {2020},
  url = {https://arxiv.org/abs/2012.02055},
  eprinttype = {arXiv},
  eprint = {2012.02055},
  timestamp = {Fri, 04 Dec 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2012-02055.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Artif. Intell. Res. vol. 65 (2019).
@article{DBLP:journals/jair/Francois-LavetR19,
  author = {Vincent Fran{\c{c}}ois{-}Lavet and Guillaume Rabusseau and Joelle Pineau and Damien Ernst and Raphael Fonteneau},
  title = {On Overfitting and Asymptotic Bias in Batch Reinforcement Learning with Partial Observability},
  journal = {J. Artif. Intell. Res.},
  volume = {65},
  pages = {1--30},
  year = {2019},
  url = {https://doi.org/10.1613/jair.1.11478},
  doi = {10.1613/JAIR.1.11478},
  timestamp = {Tue, 21 May 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/jair/Francois-LavetR19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2019.
@inproceedings{DBLP:conf/aaai/CrawfordP19,
  author = {Eric Crawford and Joelle Pineau},
  title = {Spatially Invariant Unsupervised Object Detection with Convolutional Neural Networks},
  booktitle = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages = {3412--3420},
  publisher = {{AAAI} Press},
  year = {2019},
  url = {https://doi.org/10.1609/aaai.v33i01.33013412},
  doi = {10.1609/AAAI.V33I01.33013412},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/CrawfordP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2019. The acronym in the title is braced so
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/aaai/DoanMAMDPH19,
  author = {Thang Doan and Jo{\~{a}}o Monteiro and Isabela Albuquerque and Bogdan Mazoure and Audrey Durand and Joelle Pineau and R. Devon Hjelm},
  title = {On-Line Adaptative Curriculum Learning for {GANs}},
  booktitle = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages = {3470--3477},
  publisher = {{AAAI} Press},
  year = {2019},
  url = {https://doi.org/10.1609/aaai.v33i01.33013470},
  doi = {10.1609/AAAI.V33I01.33013470},
  timestamp = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/DoanMAMDPH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2019.
@inproceedings{DBLP:conf/aaai/Francois-LavetB19,
  author = {Vincent Fran{\c{c}}ois{-}Lavet and Yoshua Bengio and Doina Precup and Joelle Pineau},
  title = {Combined Reinforcement Learning via Abstract Representations},
  booktitle = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages = {3582--3589},
  publisher = {{AAAI} Press},
  year = {2019},
  url = {https://doi.org/10.1609/aaai.v33i01.33013582},
  doi = {10.1609/AAAI.V33I01.33013582},
  timestamp = {Tue, 02 Feb 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/aaai/Francois-LavetB19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AISTATS 2019 (PMLR vol. 89).
@inproceedings{DBLP:conf/aistats/WangZLSP19,
  author = {Boyu Wang and Hejia Zhang and Peng Liu and Zebang Shen and Joelle Pineau},
  editor = {Kamalika Chaudhuri and Masashi Sugiyama},
  title = {Multitask Metric Learning: Theory and Algorithm},
  booktitle = {The 22nd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series = {Proceedings of Machine Learning Research},
  volume = {89},
  pages = {3362--3371},
  publisher = {{PMLR}},
  year = {2019},
  url = {http://proceedings.mlr.press/v89/wang19f.html},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/aistats/WangZLSP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAMAS 2019.
@inproceedings{DBLP:conf/atal/LoweFBPD19,
  author = {Ryan Lowe and Jakob N. Foerster and Y{-}Lan Boureau and Joelle Pineau and Yann N. Dauphin},
  editor = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title = {On the Pitfalls of Measuring Emergent Communication},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages = {693--701},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year = {2019},
  url = {http://dl.acm.org/citation.cfm?id=3331757},
  timestamp = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/atal/LoweFBPD19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CoRL 2019 (PMLR vol. 100).
@inproceedings{DBLP:conf/corl/MazoureDDPH19,
  author = {Bogdan Mazoure and Thang Doan and Audrey Durand and Joelle Pineau and R. Devon Hjelm},
  editor = {Leslie Pack Kaelbling and Danica Kragic and Komei Sugiura},
  title = {Leveraging exploration in off-policy algorithms via normalizing flows},
  booktitle = {3rd Annual Conference on Robot Learning, CoRL 2019, Osaka, Japan, October 30 - November 1, 2019, Proceedings},
  series = {Proceedings of Machine Learning Research},
  volume = {100},
  pages = {430--444},
  publisher = {{PMLR}},
  year = {2019},
  url = {http://proceedings.mlr.press/v100/mazoure20a.html},
  timestamp = {Mon, 25 May 2020 12:12:52 +0200},
  biburl = {https://dblp.org/rec/conf/corl/MazoureDDPH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, LANTERN workshop at EMNLP-IJCNLP 2019.
@inproceedings{DBLP:conf/emnlp/GuptaLFKP19,
  author = {Abhinav Gupta and Ryan Lowe and Jakob N. Foerster and Douwe Kiela and Joelle Pineau},
  editor = {Aditya Mogadala and Dietrich Klakow and Sandro Pezzelle and Marie{-}Francine Moens},
  title = {Seeded self-play for language learning},
  booktitle = {Proceedings of the Beyond Vision and LANguage: inTEgrating Real-world kNowledge, LANTERN@EMNLP-IJCNLP 2019, Hong Kong, China, November 3, 2019},
  pages = {62--66},
  publisher = {Association for Computational Linguistics},
  year = {2019},
  url = {https://doi.org/10.18653/v1/D19-6409},
  doi = {10.18653/V1/D19-6409},
  timestamp = {Fri, 06 Aug 2021 00:40:22 +0200},
  biburl = {https://dblp.org/rec/conf/emnlp/GuptaLFKP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, EMNLP-IJCNLP 2019.
@inproceedings{DBLP:conf/emnlp/SinhaSDPH19,
  author = {Koustuv Sinha and Shagun Sodhani and Jin Dong and Joelle Pineau and William L. Hamilton},
  editor = {Kentaro Inui and Jing Jiang and Vincent Ng and Xiaojun Wan},
  title = {{CLUTRR:} {A} Diagnostic Benchmark for Inductive Reasoning from Text},
  booktitle = {Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China, November 3-7, 2019},
  pages = {4505--4514},
  publisher = {Association for Computational Linguistics},
  year = {2019},
  url = {https://doi.org/10.18653/v1/D19-1458},
  doi = {10.18653/V1/D19-1458},
  timestamp = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl = {https://dblp.org/rec/conf/emnlp/SinhaSDPH19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2019 (PMLR vol. 97). The method name in the title is
% braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icml/DasGRBPRP19,
  author = {Abhishek Das and Th{\'{e}}ophile Gervet and Joshua Romoff and Dhruv Batra and Devi Parikh and Mike Rabbat and Joelle Pineau},
  editor = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title = {{TarMAC}: Targeted Multi-Agent Communication},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {97},
  pages = {1538--1546},
  publisher = {{PMLR}},
  year = {2019},
  url = {http://proceedings.mlr.press/v97/das19a.html},
  timestamp = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl = {https://dblp.org/rec/conf/icml/DasGRBPRP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2019 (PMLR vol. 97).
@inproceedings{DBLP:conf/icml/Romoff0TOPB19,
  author = {Joshua Romoff and Peter Henderson and Ahmed Touati and Yann Ollivier and Joelle Pineau and Emma Brunskill},
  editor = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title = {Separable value functions across time-scales},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {97},
  pages = {5468--5477},
  publisher = {{PMLR}},
  year = {2019},
  url = {http://proceedings.mlr.press/v97/romoff19a.html},
  timestamp = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/Romoff0TOPB19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IROS 2019. The mixed-case acronym in the title is braced
% so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/iros/CacciaHCP19,
  author = {Lucas Caccia and Herke van Hoof and Aaron C. Courville and Joelle Pineau},
  title = {Deep Generative Modeling of {LiDAR} Data},
  booktitle = {2019 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2019, Macau, SAR, China, November 3-8, 2019},
  pages = {5034--5040},
  publisher = {{IEEE}},
  year = {2019},
  url = {https://doi.org/10.1109/IROS40897.2019.8968535},
  doi = {10.1109/IROS40897.2019.8968535},
  timestamp = {Fri, 31 Jan 2020 10:27:14 +0100},
  biburl = {https://dblp.org/rec/conf/iros/CacciaHCP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2019. The game name in the title is braced so
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/PaquetteLBSOKPS19,
  author = {Philip Paquette and Yuchen Lu and Steven Bocco and Max O. Smith and Satya Ortiz{-}Gagne and Jonathan K. Kummerfeld and Joelle Pineau and Satinder Singh and Aaron C. Courville},
  editor = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title = {No-Press {Diplomacy}: Modeling Multi-Agent Gameplay},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages = {4476--4487},
  year = {2019},
  url = {https://proceedings.neurips.cc/paper/2019/hash/84b20b1f5a0d103f5710bb67a043cd78-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl = {https://dblp.org/rec/conf/nips/PaquetteLBSOKPS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2019.
@inproceedings{DBLP:conf/nips/AssranRBPR19,
  author = {Mahmoud Assran and Joshua Romoff and Nicolas Ballas and Joelle Pineau and Mike Rabbat},
  editor = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title = {Gossip-based Actor-Learner Architectures for Deep Reinforcement Learning},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages = {13299--13309},
  year = {2019},
  url = {https://proceedings.neurips.cc/paper/2019/hash/a1a527267c0d33a86382a03c4c721cd2-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/AssranRBPR19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, UAI 2019 (PMLR vol. 115).
@inproceedings{DBLP:conf/uai/TouatiSRPV19,
  author = {Ahmed Touati and Harsh Satija and Joshua Romoff and Joelle Pineau and Pascal Vincent},
  editor = {Amir Globerson and Ricardo Silva},
  title = {Randomized Value Functions via Multiplicative Normalizing Flows},
  booktitle = {Proceedings of the Thirty-Fifth Conference on Uncertainty in Artificial Intelligence, {UAI} 2019, Tel Aviv, Israel, July 22-25, 2019},
  series = {Proceedings of Machine Learning Research},
  volume = {115},
  pages = {422--432},
  publisher = {{AUAI} Press},
  year = {2019},
  url = {http://proceedings.mlr.press/v115/touati20a.html},
  timestamp = {Tue, 15 Dec 2020 17:40:18 +0100},
  biburl = {https://dblp.org/rec/conf/uai/TouatiSRPV19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1902.00098 (CoRR, 2019). The challenge name in the title is
% braced against sentence-casing; the arXiv URL uses https like the 2020 entries.
@article{DBLP:journals/corr/abs-1902-00098,
  author = {Emily Dinan and Varvara Logacheva and Valentin Malykh and Alexander H. Miller and Kurt Shuster and Jack Urbanek and Douwe Kiela and Arthur Szlam and Iulian Serban and Ryan Lowe and Shrimai Prabhumoye and Alan W. Black and Alexander I. Rudnicky and Jason D. Williams and Joelle Pineau and Mikhail Burtsev and Jason Weston},
  title = {The Second Conversational Intelligence Challenge ({ConvAI2})},
  journal = {CoRR},
  volume = {abs/1902.00098},
  year = {2019},
  url = {https://arxiv.org/abs/1902.00098},
  eprinttype = {arXiv},
  eprint = {1902.00098},
  timestamp = {Fri, 01 Dec 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1902-00098.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1902.01883 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1902-01883,
  author = {Joshua Romoff and Peter Henderson and Ahmed Touati and Yann Ollivier and Emma Brunskill and Joelle Pineau},
  title = {Separating value functions across time-scales},
  journal = {CoRR},
  volume = {abs/1902.01883},
  year = {2019},
  url = {https://arxiv.org/abs/1902.01883},
  eprinttype = {arXiv},
  eprint = {1902.01883},
  timestamp = {Tue, 21 May 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1902-01883.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.05168 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1903-05168,
  author = {Ryan Lowe and Jakob N. Foerster and Y{-}Lan Boureau and Joelle Pineau and Yann N. Dauphin},
  title = {On the Pitfalls of Measuring Emergent Communication},
  journal = {CoRR},
  volume = {abs/1903.05168},
  year = {2019},
  url = {https://arxiv.org/abs/1903.05168},
  eprinttype = {arXiv},
  eprint = {1903.05168},
  timestamp = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1903-05168.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1905.06893 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1905-06893,
  author = {Bogdan Mazoure and Thang Doan and Audrey Durand and R. Devon Hjelm and Joelle Pineau},
  title = {Leveraging exploration in off-policy algorithms via normalizing flows},
  journal = {CoRR},
  volume = {abs/1905.06893},
  year = {2019},
  url = {https://arxiv.org/abs/1905.06893},
  eprinttype = {arXiv},
  eprint = {1905.06893},
  timestamp = {Tue, 28 May 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1905-06893.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1905.09562 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1905-09562,
  author = {Pierre Thodoroff and Nishanth Anand and Lucas Caccia and Doina Precup and Joelle Pineau},
  title = {Recurrent Value Functions},
  journal = {CoRR},
  volume = {abs/1905.09562},
  year = {2019},
  url = {https://arxiv.org/abs/1905.09562},
  eprinttype = {arXiv},
  eprint = {1905.09562},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1905-09562.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.04585 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1906-04585,
  author = {Mahmoud Assran and Joshua Romoff and Nicolas Ballas and Joelle Pineau and Mike Rabbat},
  title = {Gossip-based Actor-Learner Architectures for Deep Reinforcement Learning},
  journal = {CoRR},
  volume = {abs/1906.04585},
  year = {2019},
  url = {https://arxiv.org/abs/1906.04585},
  eprinttype = {arXiv},
  eprint = {1906.04585},
  timestamp = {Fri, 14 Jun 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1906-04585.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.10437 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1906-10437,
  author = {Amy Zhang and Zachary C. Lipton and Luis Pineda and Kamyar Azizzadenesheli and Anima Anandkumar and Laurent Itti and Joelle Pineau and Tommaso Furlanello},
  title = {Learning Causal State Representations of Partially Observable Environments},
  journal = {CoRR},
  volume = {abs/1906.10437},
  year = {2019},
  url = {https://arxiv.org/abs/1906.10437},
  eprinttype = {arXiv},
  eprint = {1906.10437},
  timestamp = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1906-10437.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1908.06177 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1908-06177,
  author = {Koustuv Sinha and Shagun Sodhani and Jin Dong and Joelle Pineau and William L. Hamilton},
  title = {{CLUTRR:} {A} Diagnostic Benchmark for Inductive Reasoning from Text},
  journal = {CoRR},
  volume = {abs/1908.06177},
  year = {2019},
  url = {https://arxiv.org/abs/1908.06177},
  eprinttype = {arXiv},
  eprint = {1908.06177},
  timestamp = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1908-06177.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1909.02128 (CoRR, 2019). The game name in the title is braced
% against sentence-casing; the arXiv URL uses https like the 2020 entries.
@article{DBLP:journals/corr/abs-1909-02128,
  author = {Philip Paquette and Yuchen Lu and Steven Bocco and Max O. Smith and Satya Ortiz{-}Gagne and Jonathan K. Kummerfeld and Satinder Singh and Joelle Pineau and Aaron C. Courville},
  title = {No Press {Diplomacy}: Modeling Multi-Agent Gameplay},
  journal = {CoRR},
  volume = {abs/1909.02128},
  year = {2019},
  url = {https://arxiv.org/abs/1909.02128},
  eprinttype = {arXiv},
  eprint = {1909.02128},
  timestamp = {Thu, 21 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1909-02128.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1909.07543 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1909-07543,
  author = {Thang Doan and Bogdan Mazoure and Audrey Durand and Joelle Pineau and R. Devon Hjelm},
  title = {Attraction-Repulsion Actor-Critic for Continuous Control Reinforcement Learning},
  journal = {CoRR},
  volume = {abs/1909.07543},
  year = {2019},
  url = {https://arxiv.org/abs/1909.07543},
  eprinttype = {arXiv},
  eprint = {1909.07543},
  timestamp = {Mon, 23 Sep 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1909-07543.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1910.01708 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1910-01708,
  author = {Scott Fujimoto and Edoardo Conti and Mohammad Ghavamzadeh and Joelle Pineau},
  title = {Benchmarking Batch Deep Reinforcement Learning Algorithms},
  journal = {CoRR},
  volume = {abs/1910.01708},
  year = {2019},
  url = {https://arxiv.org/abs/1910.01708},
  eprinttype = {arXiv},
  eprint = {1910.01708},
  timestamp = {Wed, 09 Oct 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1910-01708.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1910.01741 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1910-01741,
  author = {Denis Yarats and Amy Zhang and Ilya Kostrikov and Brandon Amos and Joelle Pineau and Rob Fergus},
  title = {Improving Sample Efficiency in Model-Free Reinforcement Learning from Images},
  journal = {CoRR},
  volume = {abs/1910.01741},
  year = {2019},
  url = {https://arxiv.org/abs/1910.01741},
  eprinttype = {arXiv},
  eprint = {1910.01741},
  timestamp = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1910-01741.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1910.04054 (CoRR, 2019). The word after the braced colon is
% itself braced (same convention as the CLUTRR titles in this file) so it keeps
% its capital; the arXiv URL uses https like the 2020 entries.
@article{DBLP:journals/corr/abs-1910-04054,
  author = {Viswanath Sivakumar and Tim Rockt{\"{a}}schel and Alexander H. Miller and Heinrich K{\"{u}}ttler and Nantas Nardelli and Mike Rabbat and Joelle Pineau and Sebastian Riedel},
  title = {{MVFST-RL:} {An} Asynchronous {RL} Framework for Congestion Control with Delayed Actions},
  journal = {CoRR},
  volume = {abs/1910.04054},
  year = {2019},
  url = {https://arxiv.org/abs/1910.04054},
  eprinttype = {arXiv},
  eprint = {1910.04054},
  timestamp = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1910-04054.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.08019 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1911-08019,
  author = {Lucas Caccia and Eugene Belilovsky and Massimo Caccia and Joelle Pineau},
  title = {Online Learned Continual Compression with Stacked Quantization Module},
  journal = {CoRR},
  volume = {abs/1911.08019},
  year = {2019},
  url = {https://arxiv.org/abs/1911.08019},
  eprinttype = {arXiv},
  eprint = {1911.08019},
  timestamp = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1911-08019.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.09033 (CoRR, 2019). The arXiv URL uses https, matching
% the 2020 arXiv entries in this file.
@article{DBLP:journals/corr/abs-1911-09033,
  author = {Eric Crawford and Joelle Pineau},
  title = {Exploiting Spatial Invariance for Scalable Unsupervised Object Tracking},
  journal = {CoRR},
  volume = {abs/1911.09033},
  year = {2019},
  url = {https://arxiv.org/abs/1911.09033},
  eprinttype = {arXiv},
  eprint = {1911.09033},
  timestamp = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1911-09033.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Dialogue Discourse 9(1), 2018.
@article{DBLP:journals/dad/SerbanLHCP18,
  author = {Iulian Vlad Serban and Ryan Lowe and Peter Henderson and Laurent Charlin and Joelle Pineau},
  title = {A Survey of Available Corpora For Building Data-Driven Dialogue Systems: The Journal Version},
  journal = {Dialogue Discourse},
  volume = {9},
  number = {1},
  pages = {1--49},
  year = {2018},
  url = {http://dad.uni-bielefeld.de/index.php/dad/article/view/3690},
  timestamp = {Wed, 20 May 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/dad/SerbanLHCP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Found. Trends Mach. Learn. 11(3-4), 2018.
@article{DBLP:journals/ftml/Francois-LavetH18,
  author = {Vincent Fran{\c{c}}ois{-}Lavet and Peter Henderson and Riashat Islam and Marc G. Bellemare and Joelle Pineau},
  title = {An Introduction to Deep Reinforcement Learning},
  journal = {Found. Trends Mach. Learn.},
  volume = {11},
  number = {3-4},
  pages = {219--354},
  year = {2018},
  url = {https://doi.org/10.1561/2200000071},
  doi = {10.1561/2200000071},
  timestamp = {Thu, 18 Jun 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/ftml/Francois-LavetH18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Int. J. Soc. Robotics 10(1), 2018.
@article{DBLP:journals/ijsr/GhorbelPGJS18,
  author = {Mahmoud Ghorbel and Joelle Pineau and Richard Gourdeau and Shervin Javdani and Siddhartha S. Srinivasa},
  title = {A Decision-Theoretic Approach for the Collaborative Control of a Smart Wheelchair},
  journal = {Int. J. Soc. Robotics},
  volume = {10},
  number = {1},
  pages = {131--145},
  year = {2018},
  url = {https://doi.org/10.1007/s12369-017-0434-7},
  doi = {10.1007/S12369-017-0434-7},
  timestamp = {Fri, 25 Dec 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/ijsr/GhorbelPGJS18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Mach. Learn. Res. vol. 19 (2018).
@article{DBLP:journals/jmlr/DurandMP18,
  author = {Audrey Durand and Odalric{-}Ambrym Maillard and Joelle Pineau},
  title = {Streaming kernel regression with provably adaptive mean, variance, and regularization},
  journal = {J. Mach. Learn. Res.},
  volume = {19},
  pages = {17:1--17:34},
  year = {2018},
  url = {https://jmlr.org/papers/v19/17-404.html},
  timestamp = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/jmlr/DurandMP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2018. The method name in the title is braced so
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/aaai/0002CBMPP18,
  author = {Peter Henderson and Wei{-}Di Chang and Pierre{-}Luc Bacon and David Meger and Joelle Pineau and Doina Precup},
  editor = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title = {{OptionGAN}: Learning Joint Reward-Policy Options Using Generative Adversarial Inverse Reinforcement Learning},
  booktitle = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages = {3199--3206},
  publisher = {{AAAI} Press},
  year = {2018},
  url = {https://doi.org/10.1609/aaai.v32i1.11775},
  doi = {10.1609/AAAI.V32I1.11775},
  timestamp = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/0002CBMPP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2018.
@inproceedings{DBLP:conf/aaai/0002IBPPM18,
  author = {Peter Henderson and Riashat Islam and Philip Bachman and Joelle Pineau and Doina Precup and David Meger},
  editor = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title = {Deep Reinforcement Learning That Matters},
  booktitle = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages = {3207--3214},
  publisher = {{AAAI} Press},
  year = {2018},
  url = {https://doi.org/10.1609/aaai.v32i1.11694},
  doi = {10.1609/AAAI.V32I1.11694},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/0002IBPPM18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AIES 2018.
@inproceedings{DBLP:conf/aies/0002SAKFLP18,
  author = {Peter Henderson and Koustuv Sinha and Nicolas Angelard{-}Gontier and Nan Rosemary Ke and Genevieve Fried and Ryan Lowe and Joelle Pineau},
  editor = {Jason Furman and Gary E. Marchant and Huw Price and Francesca Rossi},
  title = {Ethical Challenges in Data-Driven Dialogue Systems},
  booktitle = {Proceedings of the 2018 {AAAI/ACM} Conference on AI, Ethics, and Society, {AIES} 2018, New Orleans, LA, USA, February 02-03, 2018},
  pages = {123--129},
  publisher = {{ACM}},
  year = {2018},
  url = {https://doi.org/10.1145/3278721.3278777},
  doi = {10.1145/3278721.3278777},
  timestamp = {Tue, 23 Jan 2024 13:25:45 +0100},
  biburl = {https://dblp.org/rec/conf/aies/0002SAKFLP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CoRL 2018 (PMLR vol. 87).
@inproceedings{DBLP:conf/corl/Romoff0PFP18,
  author = {Joshua Romoff and Peter Henderson and Alexandre Pich{\'{e}} and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  title = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  booktitle = {2nd Annual Conference on Robot Learning, CoRL 2018, Z{\"{u}}rich, Switzerland, 29-31 October 2018, Proceedings},
  series = {Proceedings of Machine Learning Research},
  volume = {87},
  pages = {674--699},
  publisher = {{PMLR}},
  year = {2018},
  url = {http://proceedings.mlr.press/v87/romoff18a.html},
  timestamp = {Wed, 03 Apr 2019 18:17:24 +0200},
  biburl = {https://dblp.org/rec/conf/corl/Romoff0PFP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, EMNLP 2018.
@inproceedings{DBLP:conf/emnlp/ParthasarathiP18,
  author = {Prasanna Parthasarathi and Joelle Pineau},
  editor = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  title = {Extending Neural Generative Conversational Model using External Knowledge Sources},
  booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages = {690--695},
  publisher = {Association for Computational Linguistics},
  year = {2018},
  url = {https://doi.org/10.18653/v1/d18-1073},
  doi = {10.18653/V1/D18-1073},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/emnlp/ParthasarathiP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop-track paper, ICLR 2018.
@inproceedings{DBLP:conf/iclr/RomoffP0FP18,
  author = {Joshua Romoff and Alexandre Pich{\'{e}} and Peter Henderson and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  title = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  booktitle = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=r1vcHYJvM},
  timestamp = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/RomoffP0FP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop-track paper, ICLR 2018.
@inproceedings{DBLP:conf/iclr/ZhangSP18,
  author = {Amy Zhang and Harsh Satija and Joelle Pineau},
  title = {Decoupling Dynamics and Reward for Transfer Learning},
  booktitle = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=H1aoddyvM},
  timestamp = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/ZhangSP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2018 (PMLR vol. 80). The acronym in the title is
% braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/icml/KeZSLTBPCP18,
  author = {Nan Rosemary Ke and Konrad Zolna and Alessandro Sordoni and Zhouhan Lin and Adam Trischler and Yoshua Bengio and Joelle Pineau and Laurent Charlin and Christopher J. Pal},
  editor = {Jennifer G. Dy and Andreas Krause},
  title = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  booktitle = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series = {Proceedings of Machine Learning Research},
  volume = {80},
  pages = {2559--2568},
  publisher = {{PMLR}},
  year = {2018},
  url = {http://proceedings.mlr.press/v80/ke18a.html},
  timestamp = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl = {https://dblp.org/rec/conf/icml/KeZSLTBPCP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2018 (PMLR vol. 80).
@inproceedings{DBLP:conf/icml/SmithHP18,
  author = {Matthew J. A. Smith and Herke van Hoof and Joelle Pineau},
  editor = {Jennifer G. Dy and Andreas Krause},
  title = {An Inference-Based Policy Gradient Method for Learning Options},
  booktitle = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series = {Proceedings of Machine Learning Research},
  volume = {80},
  pages = {4710--4719},
  publisher = {{PMLR}},
  year = {2018},
  url = {http://proceedings.mlr.press/v80/smith18a.html},
  timestamp = {Thu, 07 Oct 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/SmithHP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlhc/DurandAISMP18,
  author     = {Audrey Durand and Charis Achilleos and Demetris Iacovides and Katerina Strati and Georgios D. Mitsis and Joelle Pineau},
  editor     = {Finale Doshi{-}Velez and Jim Fackler and Ken Jung and David C. Kale and Rajesh Ranganath and Byron C. Wallace and Jenna Wiens},
  title      = {Contextual Bandits for Adapting Treatment in a Mouse Model of de Novo Carcinogenesis},
  booktitle  = {Proceedings of the Machine Learning for Healthcare Conference, {MLHC} 2018, 17-18 August 2018, Palo Alto, California},
  series     = {Proceedings of Machine Learning Research},
  volume     = {85},
  pages      = {67--82},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v85/durand18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:31 +0200},
  biburl     = {https://dblp.org/rec/conf/mlhc/DurandAISMP18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {Markov} is brace-protected so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/nips/ThodoroffDPP18,
  author     = {Pierre Thodoroff and Audrey Durand and Joelle Pineau and Doina Precup},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Temporal Regularization for {Markov} Decision Process},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {1784--1794},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/4b0250793549726d5c1ea3906726ebfe-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/ThodoroffDPP18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1801-06700,
  author     = {Iulian Vlad Serban and Chinnadhurai Sankar and Mathieu Germain and Saizheng Zhang and Zhouhan Lin and Sandeep Subramanian and Taesup Kim and Michael Pieper and Sarath Chandar and Nan Rosemary Ke and Sai Rajeswar and Alexandre de Br{\'{e}}bisson and Jose M. R. Sotelo and Dendi Suhubdy and Vincent Michalski and Alexandre Nguyen and Joelle Pineau and Yoshua Bengio},
  title      = {A Deep Reinforcement Learning Chatbot (Short Version)},
  journal    = {CoRR},
  volume     = {abs/1801.06700},
  year       = {2018},
  url        = {http://arxiv.org/abs/1801.06700},
  eprinttype = {arXiv},
  eprint     = {1801.06700},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1801-06700.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1802-09484,
  author     = {Valentin Thomas and Emmanuel Bengio and William Fedus and Jules Pondard and Philippe Beaudoin and Hugo Larochelle and Joelle Pineau and Doina Precup and Yoshua Bengio},
  title      = {Disentangling the independently controllable factors of variation by interacting with the world},
  journal    = {CoRR},
  volume     = {abs/1802.09484},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.09484},
  eprinttype = {arXiv},
  eprint     = {1802.09484},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-09484.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1804-10689,
  author     = {Amy Zhang and Harsh Satija and Joelle Pineau},
  title      = {Decoupling Dynamics and Reward for Transfer Learning},
  journal    = {CoRR},
  volume     = {abs/1804.10689},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.10689},
  eprinttype = {arXiv},
  eprint     = {1804.10689},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-10689.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1805-03359,
  author     = {Joshua Romoff and Alexandre Pich{\'{e}} and Peter Henderson and Vincent Fran{\c{c}}ois{-}Lavet and Joelle Pineau},
  title      = {Reward Estimation for Variance Reduction in Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1805.03359},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.03359},
  eprinttype = {arXiv},
  eprint     = {1805.03359},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-03359.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1806-02315,
  author     = {Ahmed Touati and Harsh Satija and Joshua Romoff and Joelle Pineau and Pascal Vincent},
  title      = {Randomized Value Functions via Multiplicative Normalizing Flows},
  journal    = {CoRR},
  volume     = {abs/1806.02315},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.02315},
  eprinttype = {arXiv},
  eprint     = {1806.02315},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-02315.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RNNs} is brace-protected so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-1806-04342,
  author     = {Nan Rosemary Ke and Konrad Zolna and Alessandro Sordoni and Zhouhan Lin and Adam Trischler and Yoshua Bengio and Joelle Pineau and Laurent Charlin and Chris Pal},
  title      = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  journal    = {CoRR},
  volume     = {abs/1806.04342},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.04342},
  eprinttype = {arXiv},
  eprint     = {1806.04342},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-04342.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1806-07937,
  author     = {Amy Zhang and Nicolas Ballas and Joelle Pineau},
  title      = {A Dissection of Overfitting and Generalization in Continuous Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1806.07937},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.07937},
  eprinttype = {arXiv},
  eprint     = {1806.07937},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-07937.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1807-04723,
  author     = {Iulian Vlad Serban and Chinnadhurai Sankar and Michael Pieper and Joelle Pineau and Yoshua Bengio},
  title      = {The Bottleneck Simulator: {A} Model-based Deep Reinforcement Learning Approach},
  journal    = {CoRR},
  volume     = {abs/1807.04723},
  year       = {2018},
  url        = {http://arxiv.org/abs/1807.04723},
  eprinttype = {arXiv},
  eprint     = {1807.04723},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-04723.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {GANs} is brace-protected so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-1808-00020,
  author     = {Thang Doan and Jo{\~{a}}o Monteiro and Isabela Albuquerque and Bogdan Mazoure and Audrey Durand and Joelle Pineau and R. Devon Hjelm},
  title      = {Online Adaptative Curriculum Learning for {GANs}},
  journal    = {CoRR},
  volume     = {abs/1808.00020},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.00020},
  eprinttype = {arXiv},
  eprint     = {1808.00020},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-00020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-04506,
  author     = {Vincent Fran{\c{c}}ois{-}Lavet and Yoshua Bengio and Doina Precup and Joelle Pineau},
  title      = {Combined Reinforcement Learning via Abstract Representations},
  journal    = {CoRR},
  volume     = {abs/1809.04506},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.04506},
  eprinttype = {arXiv},
  eprint     = {1809.04506},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-04506.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-04988,
  author     = {Eric Crawford and Guillaume Rabusseau and Joelle Pineau},
  title      = {Sequential Coordination of Deep Models for Learning Visual Arithmetic},
  journal    = {CoRR},
  volume     = {abs/1809.04988},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.04988},
  eprinttype = {arXiv},
  eprint     = {1809.04988},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-04988.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-05524,
  author     = {Prasanna Parthasarathi and Joelle Pineau},
  title      = {Extending Neural Generative Conversational Model using External Knowledge Sources},
  journal    = {CoRR},
  volume     = {abs/1809.05524},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.05524},
  eprinttype = {arXiv},
  eprint     = {1809.05524},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-05524.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1810-02525,
  author     = {Peter Henderson and Joshua Romoff and Joelle Pineau},
  title      = {Where Did My Optimum Go?: An Empirical Analysis of Gradient Descent Optimization in Policy Gradient Methods},
  journal    = {CoRR},
  volume     = {abs/1810.02525},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.02525},
  eprinttype = {arXiv},
  eprint     = {1810.02525},
  timestamp  = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-02525.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {TarMAC} is brace-protected so sentence-casing styles keep its mixed-case spelling.
@article{DBLP:journals/corr/abs-1810-11187,
  author     = {Abhishek Das and Th{\'{e}}ophile Gervet and Joshua Romoff and Dhruv Batra and Devi Parikh and Michael G. Rabbat and Joelle Pineau},
  title      = {{TarMAC}: Targeted Multi-Agent Communication},
  journal    = {CoRR},
  volume     = {abs/1810.11187},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.11187},
  eprinttype = {arXiv},
  eprint     = {1810.11187},
  timestamp  = {Mon, 09 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-11187.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {Markov} is brace-protected so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-1811-00429,
  author     = {Pierre Thodoroff and Audrey Durand and Joelle Pineau and Doina Precup},
  title      = {Temporal Regularization in {Markov} Decision Process},
  journal    = {CoRR},
  volume     = {abs/1811.00429},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.00429},
  eprinttype = {arXiv},
  eprint     = {1811.00429},
  timestamp  = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-00429.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-01302,
  author     = {Peter Henderson and Koustuv Sinha and Nan Rosemary Ke and Joelle Pineau},
  title      = {Adversarial Gain},
  journal    = {CoRR},
  volume     = {abs/1811.01302},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.01302},
  eprinttype = {arXiv},
  eprint     = {1811.01302},
  timestamp  = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-01302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {GANs} is brace-protected so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-1811-02549,
  author     = {Massimo Caccia and Lucas Caccia and William Fedus and Hugo Larochelle and Joelle Pineau and Laurent Charlin},
  title      = {Language {GANs} Falling Short},
  journal    = {CoRR},
  volume     = {abs/1811.02549},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.02549},
  eprinttype = {arXiv},
  eprint     = {1811.02549},
  timestamp  = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-02549.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RLLChatbot} and {ConvAI} are brace-protected so sentence-casing styles keep their mixed-case spelling.
@article{DBLP:journals/corr/abs-1811-02714,
  author     = {Nicolas Gontier and Koustuv Sinha and Peter Henderson and Iulian Serban and Michael Noseworthy and Prasanna Parthasarathi and Joelle Pineau},
  title      = {The {RLLChatbot}: a solution to the {ConvAI} challenge},
  journal    = {CoRR},
  volume     = {abs/1811.02714},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.02714},
  eprinttype = {arXiv},
  eprint     = {1811.02714},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-02714.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-02959,
  author     = {Koustuv Sinha and Shagun Sodhani and William L. Hamilton and Joelle Pineau},
  title      = {Compositional Language Understanding with Text-based Relational Reasoning},
  journal    = {CoRR},
  volume     = {abs/1811.02959},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.02959},
  eprinttype = {arXiv},
  eprint     = {1811.02959},
  timestamp  = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-02959.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-06032,
  author     = {Amy Zhang and Yuxin Wu and Joelle Pineau},
  title      = {Natural Environment Benchmarks for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1811.06032},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.06032},
  eprinttype = {arXiv},
  eprint     = {1811.06032},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-06032.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-12560,
  author     = {Vincent Fran{\c{c}}ois{-}Lavet and Peter Henderson and Riashat Islam and Marc G. Bellemare and Joelle Pineau},
  title      = {An Introduction to Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1811.12560},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.12560},
  eprinttype = {arXiv},
  eprint     = {1811.12560},
  timestamp  = {Mon, 03 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-12560.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {LiDAR} is brace-protected so sentence-casing styles keep its mixed-case spelling.
@article{DBLP:journals/corr/abs-1812-01180,
  author     = {Lucas Caccia and Herke van Hoof and Aaron C. Courville and Joelle Pineau},
  title      = {Deep Generative Modeling of {LiDAR} Data},
  journal    = {CoRR},
  volume     = {abs/1812.01180},
  year       = {2018},
  url        = {http://arxiv.org/abs/1812.01180},
  eprinttype = {arXiv},
  eprint     = {1812.01180},
  timestamp  = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1812-01180.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the corpus name is brace-protected against sentence-casing styles.
% Journal: the export dropped the ampersand; restored as "Dialogue \& Discourse".
@article{DBLP:journals/dad/LowePSCLP17,
  author     = {Ryan Thomas Lowe and Nissan Pow and Iulian Vlad Serban and Laurent Charlin and Chia{-}Wei Liu and Joelle Pineau},
  title      = {Training End-to-End Dialogue Systems with the {Ubuntu Dialogue Corpus}},
  journal    = {Dialogue \& Discourse},
  volume     = {8},
  number     = {1},
  pages      = {31--65},
  year       = {2017},
  url        = {http://dad.uni-bielefeld.de/index.php/dad/article/view/3698},
  timestamp  = {Wed, 20 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/dad/LowePSCLP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: "El Youssef" is a two-word surname; the comma form stops BibTeX from
% parsing "El" as a given name (First-Last form takes only the last word as surname).
@article{DBLP:journals/titb/EmamiYRPCH17,
  author     = {Ali Emami and El Youssef, Joseph and Remi Rabasa{-}Lhoret and Joelle Pineau and Jessica R. Castle and Ahmad Haidar},
  title      = {Modeling Glucagon Action in Patients With Type 1 Diabetes},
  journal    = {{IEEE} J. Biomed. Health Informatics},
  volume     = {21},
  number     = {4},
  pages      = {1163--1171},
  year       = {2017},
  url        = {https://doi.org/10.1109/JBHI.2016.2593630},
  doi        = {10.1109/JBHI.2016.2593630},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/titb/EmamiYRPCH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/SerbanSLCPCB17,
  author     = {Iulian Vlad Serban and Alessandro Sordoni and Ryan Lowe and Laurent Charlin and Joelle Pineau and Aaron C. Courville and Yoshua Bengio},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating Dialogues},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {3295--3301},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.10983},
  doi        = {10.1609/AAAI.V31I1.10983},
  timestamp  = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/SerbanSLCPCB17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {Turing} is brace-protected so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/acl/LoweNSABP17,
  author     = {Ryan Lowe and Michael Noseworthy and Iulian Vlad Serban and Nicolas Angelard{-}Gontier and Yoshua Bengio and Joelle Pineau},
  editor     = {Regina Barzilay and Min{-}Yen Kan},
  title      = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume 1: Long Papers},
  pages      = {1116--1126},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-1103},
  doi        = {10.18653/V1/P17-1103},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LoweNSABP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ai/SmithCP17,
  author     = {Matthew Smith and Laurent Charlin and Joelle Pineau},
  editor     = {Malek Mouhoub and Philippe Langlais},
  title      = {A Sparse Probabilistic Model of User Preference Data},
  booktitle  = {Advances in Artificial Intelligence - 30th Canadian Conference on Artificial Intelligence, Canadian {AI} 2017, Edmonton, AB, Canada, May 16-19, 2017, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {10233},
  pages      = {316--328},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-319-57351-9\_36},
  doi        = {10.1007/978-3-319-57351-9\_36},
  timestamp  = {Thu, 28 Sep 2023 12:27:16 +0200},
  biburl     = {https://dblp.org/rec/conf/ai/SmithCP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/emnlp/SerbanOPC17a,
  author     = {Iulian Vlad Serban and Alexander Ororbia and Joelle Pineau and Aaron C. Courville},
  editor     = {Kai{-}Wei Chang and Ming{-}Wei Chang and Vivek Srikumar and Alexander M. Rush},
  title      = {Piecewise Latent Variables for Neural Variational Text Processing},
  booktitle  = {Proceedings of the 2nd Workshop on Structured Prediction for Natural Language Processing, SPNLP@EMNLP, Copenhagen, Denmark, September 2017},
  pages      = {52--62},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/w17-4308},
  doi        = {10.18653/V1/W17-4308},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/SerbanOPC17a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: the generational suffix "II" is given in "Last, Jr, First" form; in
% First-Last form BibTeX would take "II" as the surname.
@inproceedings{DBLP:conf/emnlp/SerbanOPC17,
  author     = {Iulian Vlad Serban and Ororbia, II, Alexander G. and Joelle Pineau and Aaron C. Courville},
  editor     = {Martha Palmer and Rebecca Hwa and Sebastian Riedel},
  title      = {Piecewise Latent Variables for Neural Variational Text Processing},
  booktitle  = {Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September 9-11, 2017},
  pages      = {422--432},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/d17-1043},
  doi        = {10.18653/V1/D17-1043},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/SerbanOPC17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/BahdanauBXGLPCB17,
  author     = {Dzmitry Bahdanau and Philemon Brakel and Kelvin Xu and Anirudh Goyal and Ryan Lowe and Joelle Pineau and Aaron C. Courville and Yoshua Bengio},
  title      = {An Actor-Critic Algorithm for Sequence Prediction},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=SJDaqqveg},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BahdanauBXGLPCB17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {Turing} is brace-protected so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/iclr/LoweNSABP17,
  author     = {Ryan Lowe and Michael Noseworthy and Iulian Vlad Serban and Nicolas Angelard{-}Gontier and Yoshua Bengio and Joelle Pineau},
  title      = {Towards an automatic {Turing} test: Learning to evaluate dialogue responses},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=Sk7c3yVYg},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LoweNSABP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/RabusseauBP17,
  author     = {Guillaume Rabusseau and Borja Balle and Joelle Pineau},
  editor     = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title      = {Multitask Spectral Learning of Weighted Automata},
  booktitle  = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages      = {2588--2597},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/e655c7716a4b3ea67f48c6322fc42ed6-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/RabusseauBP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigdial/TruongPP17,
  author     = {Hoai Phuoc Truong and Prasanna Parthasarathi and Joelle Pineau},
  editor     = {Kristiina Jokinen and Manfred Stede and David DeVault and Annie Louis},
  title      = {{MACA:} {A} Modular Architecture for Conversational Agents},
  booktitle  = {Proceedings of the 18th Annual SIGdial Meeting on Discourse and Dialogue, Saarbr{\"{u}}cken, Germany, August 15-17, 2017},
  pages      = {93--102},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/w17-5513},
  doi        = {10.18653/V1/W17-5513},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sigdial/TruongPP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigdial/NoseworthyCP17,
  author     = {Michael Noseworthy and Jackie Chi Kit Cheung and Joelle Pineau},
  editor     = {Kristiina Jokinen and Manfred Stede and David DeVault and Annie Louis},
  title      = {Predicting Success in Goal-Driven Human-Human Dialogues},
  booktitle  = {Proceedings of the 18th Annual SIGdial Meeting on Discourse and Dialogue, Saarbr{\"{u}}cken, Germany, August 15-17, 2017},
  pages      = {253--262},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/w17-5531},
  doi        = {10.18653/V1/W17-5531},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/sigdial/NoseworthyCP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/BengioTPPB17,
  author     = {Emmanuel Bengio and Valentin Thomas and Joelle Pineau and Doina Precup and Yoshua Bengio},
  title      = {Independently Controllable Features},
  journal    = {CoRR},
  volume     = {abs/1703.07718},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.07718},
  eprinttype = {arXiv},
  eprint     = {1703.07718},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BengioTPPB17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-00768,
  author     = {Audrey Durand and Odalric{-}Ambrym Maillard and Joelle Pineau},
  title      = {Streaming kernel regression with provably adaptive mean, variance, and regularization},
  journal    = {CoRR},
  volume     = {abs/1708.00768},
  year       = {2017},
  url        = {http://arxiv.org/abs/1708.00768},
  eprinttype = {arXiv},
  eprint     = {1708.00768},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1708-00768.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-01289,
  author     = {Valentin Thomas and Jules Pondard and Emmanuel Bengio and Marc Sarfati and Philippe Beaudoin and Marie{-}Jean Meurs and Joelle Pineau and Doina Precup and Yoshua Bengio},
  title      = {Independently Controllable Factors},
  journal    = {CoRR},
  volume     = {abs/1708.01289},
  year       = {2017},
  url        = {http://arxiv.org/abs/1708.01289},
  eprinttype = {arXiv},
  eprint     = {1708.01289},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1708-01289.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {Turing} is brace-protected so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-1708-07149,
  author     = {Ryan Lowe and Michael Noseworthy and Iulian Vlad Serban and Nicolas Angelard{-}Gontier and Yoshua Bengio and Joelle Pineau},
  title      = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  journal    = {CoRR},
  volume     = {abs/1708.07149},
  year       = {2017},
  url        = {http://arxiv.org/abs/1708.07149},
  eprinttype = {arXiv},
  eprint     = {1708.07149},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1708-07149.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-02349,
  author     = {Iulian Vlad Serban and Chinnadhurai Sankar and Mathieu Germain and Saizheng Zhang and Zhouhan Lin and Sandeep Subramanian and Taesup Kim and Michael Pieper and Sarath Chandar and Nan Rosemary Ke and Sai Mudumba and Alexandre de Br{\'{e}}bisson and Jose Sotelo and Dendi Suhubdy and Vincent Michalski and Alexandre Nguyen and Joelle Pineau and Yoshua Bengio},
  title      = {A Deep Reinforcement Learning Chatbot},
  journal    = {CoRR},
  volume     = {abs/1709.02349},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.02349},
  eprinttype = {arXiv},
  eprint     = {1709.02349},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-02349.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-06560,
  author     = {Peter Henderson and Riashat Islam and Philip Bachman and Joelle Pineau and Doina Precup and David Meger},
  title      = {Deep Reinforcement Learning that Matters},
  journal    = {CoRR},
  volume     = {abs/1709.06560},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.06560},
  eprinttype = {arXiv},
  eprint     = {1709.06560},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-06560.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {OptionGAN} is brace-protected so sentence-casing styles keep its mixed-case spelling.
@article{DBLP:journals/corr/abs-1709-06683,
  author     = {Peter Henderson and Wei{-}Di Chang and Pierre{-}Luc Bacon and David Meger and Joelle Pineau and Doina Precup},
  title      = {{OptionGAN}: Learning Joint Reward-Policy Options using Generative Adversarial Inverse Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1709.06683},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.06683},
  eprinttype = {arXiv},
  eprint     = {1709.06683},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-06683.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: {ACtuAL} is brace-protected so sentence-casing styles keep its mixed-case spelling.
@article{DBLP:journals/corr/abs-1711-04755,
  author     = {Anirudh Goyal and Nan Rosemary Ke and Alex Lamb and R. Devon Hjelm and Chris Pal and Joelle Pineau and Yoshua Bengio},
  title      = {{ACtuAL}: Actor-Critic Under Adversarial Learning},
  journal    = {CoRR},
  volume     = {abs/1711.04755},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.04755},
  eprinttype = {arXiv},
  eprint     = {1711.04755},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-04755.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-09050,
  author     = {Peter Henderson and Koustuv Sinha and Nicolas Angelard{-}Gontier and Nan Rosemary Ke and Genevieve Fried and Ryan Lowe and Joelle Pineau},
  title      = {Ethical Challenges in Data-Driven Dialogue Systems},
  journal    = {CoRR},
  volume     = {abs/1711.09050},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.09050},
  eprinttype = {arXiv},
  eprint     = {1711.09050},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-09050.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1712-09520,
  author     = {Xingwei Cao and Guillaume Rabusseau and Joelle Pineau},
  title      = {Tensor Regression Networks with various Low-Rank Tensor Approximations},
  journal    = {CoRR},
  volume     = {abs/1712.09520},
  year       = {2017},
  url        = {http://arxiv.org/abs/1712.09520},
  eprinttype = {arXiv},
  eprint     = {1712.09520},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1712-09520.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijsr/KimP16,
  author     = {Beomjoon Kim and Joelle Pineau},
  title      = {Socially Adaptive Path Planning in Human Environments Using Inverse Reinforcement Learning},
  journal    = {Int. J. Soc. Robotics},
  volume     = {8},
  number     = {1},
  pages      = {51--66},
  year       = {2016},
  url        = {https://doi.org/10.1007/s12369-015-0310-2},
  doi        = {10.1007/S12369-015-0310-2},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ijsr/KimP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/BarretoPP16,
  author     = {Andr{\'{e}} da Motta Salles Barreto and Doina Precup and Joelle Pineau},
  title      = {Practical Kernel-Based Reinforcement Learning},
  journal    = {J. Mach. Learn. Res.},
  volume     = {17},
  pages      = {67:1--67:70},
  year       = {2016},
  url        = {https://jmlr.org/papers/v17/13-134.html},
  timestamp  = {Wed, 11 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/BarretoPP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tkde/WangP16,
  author     = {Boyu Wang and Joelle Pineau},
  title      = {Online Bagging and Boosting for Imbalanced Data Streams},
  journal    = {{IEEE} Trans. Knowl. Data Eng.},
  volume     = {28},
  number     = {12},
  pages      = {3353--3366},
  year       = {2016},
  url        = {https://doi.org/10.1109/TKDE.2016.2609424},
  doi        = {10.1109/TKDE.2016.2609424},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tkde/WangP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/BarretoBPP16,
  author     = {Andr{\'{e}} da Motta Salles Barreto and Rafael L. Beirigo and Joelle Pineau and Doina Precup},
  editor     = {Dale Schuurmans and Michael P. Wellman},
  title      = {Incremental Stochastic Factorization for Online Reinforcement Learning},
  booktitle  = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages      = {1468--1475},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {https://doi.org/10.1609/aaai.v30i1.10311},
  doi        = {10.1609/AAAI.V30I1.10311},
  timestamp  = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/BarretoBPP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WangPB16,
  author     = {Boyu Wang and Joelle Pineau and Borja Balle},
  editor     = {Dale Schuurmans and Michael P. Wellman},
  title      = {Multitask Generalized Eigenvalue Program},
  booktitle  = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages      = {2115--2121},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {https://doi.org/10.1609/aaai.v30i1.10229},
  doi        = {10.1609/AAAI.V30I1.10229},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/WangPB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/SerbanSBCP16,
  author     = {Iulian Vlad Serban and Alessandro Sordoni and Yoshua Bengio and Aaron C. Courville and Joelle Pineau},
  editor     = {Dale Schuurmans and Michael P. Wellman},
  title      = {Building End-To-End Dialogue Systems Using Generative Hierarchical Neural Network Models},
  booktitle  = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages      = {3776--3784},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {https://doi.org/10.1609/aaai.v30i1.9883},
  doi        = {10.1609/AAAI.V30I1.9883},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/SerbanSBCP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaiss/GerdzhevPMVF16,
  author    = {Martin Gerdzhev and
               Joelle Pineau and
               Ian M. Mitchell and
               Pooja Viswanathan and
               Genevi{\`{e}}ve Foley},
  title     = {On the Use of Modular Software and Hardware for Designing Wheelchair Robots},
  booktitle = {2016 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 21-23, 2016},
  publisher = {{AAAI} Press},
  year      = {2016},
  url       = {http://www.aaai.org/ocs/index.php/SSS/SSS16/paper/view/12704},
  timestamp = {Wed, 14 Nov 2018 13:16:02 +0100},
  biburl    = {https://dblp.org/rec/conf/aaaiss/GerdzhevPMVF16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/LiuLSNCP16,
  author    = {Chia{-}Wei Liu and
               Ryan Lowe and
               Iulian Serban and
               Michael Noseworthy and
               Laurent Charlin and
               Joelle Pineau},
  editor    = {Jian Su and
               Xavier Carreras and
               Kevin Duh},
  title     = {How {NOT} To Evaluate Your Dialogue System: An Empirical Study of Unsupervised Evaluation Metrics for Dialogue Response Generation},
  booktitle = {Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4, 2016},
  pages     = {2122--2132},
  publisher = {The Association for Computational Linguistics},
  year      = {2016},
  url       = {https://doi.org/10.18653/v1/d16-1230},
  doi       = {10.18653/V1/D16-1230},
  timestamp = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/LiuLSNCP16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ZhouBP16,
  author    = {Chenghui Zhou and
               Borja Balle and
               Joelle Pineau},
  editor    = {Danica Kragic and
               Antonio Bicchi and
               Alessandro De Luca},
  title     = {Learning time series models for pedestrian motion prediction},
  booktitle = {2016 {IEEE} International Conference on Robotics and Automation, {ICRA} 2016, Stockholm, Sweden, May 16-21, 2016},
  pages     = {3323--3330},
  publisher = {{IEEE}},
  year      = {2016},
  url       = {https://doi.org/10.1109/ICRA.2016.7487506},
  doi       = {10.1109/ICRA.2016.7487506},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/ZhouBP16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/WangP16,
  author    = {Boyu Wang and
               Joelle Pineau},
  editor    = {Subbarao Kambhampati},
  title     = {Generalized Dictionary for Multitask Learning with Boosting},
  booktitle = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages     = {2097--2103},
  publisher = {{IJCAI/AAAI} Press},
  year      = {2016},
  url       = {http://www.ijcai.org/Abstract/16/299},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ijcai/WangP16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlhc/ThodoroffPL16,
  author    = {Pierre Thodoroff and
               Joelle Pineau and
               Andrew Lim},
  editor    = {Finale Doshi{-}Velez and
               Jim Fackler and
               David C. Kale and
               Byron C. Wallace and
               Jenna Wiens},
  title     = {Learning Robust Features using Deep Learning for Automatic Seizure Detection},
  booktitle = {Proceedings of the 1st Machine Learning in Health Care, {MLHC} 2016, Los Angeles, CA, USA, August 19-20, 2016},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {56},
  pages     = {178--190},
  publisher = {JMLR.org},
  year      = {2016},
  url       = {http://proceedings.mlr.press/v56/Thodoroff16.html},
  timestamp = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/mlhc/ThodoroffPL16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Publisher corrected from "Computer Linguistics" to the organisation's actual name, "Computational Linguistics".
@inproceedings{DBLP:conf/sigdial/LoweSNCP16,
  author    = {Ryan Lowe and
               Iulian Vlad Serban and
               Michael Noseworthy and
               Laurent Charlin and
               Joelle Pineau},
  title     = {On the Evaluation of Dialogue Systems with Next Utterance Classification},
  booktitle = {Proceedings of the {SIGDIAL} 2016 Conference, The 17th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 13-15 September 2016, Los Angeles, CA, {USA}},
  pages     = {264--269},
  publisher = {The Association for Computational Linguistics},
  year      = {2016},
  url       = {https://doi.org/10.18653/v1/w16-3634},
  doi       = {10.18653/V1/W16-3634},
  timestamp = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sigdial/LoweSNCP16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiuLSNCP16,
  author     = {Chia{-}Wei Liu and
                Ryan Lowe and
                Iulian Vlad Serban and
                Michael Noseworthy and
                Laurent Charlin and
                Joelle Pineau},
  title      = {How {NOT} To Evaluate Your Dialogue System: An Empirical Study of Unsupervised Evaluation Metrics for Dialogue Response Generation},
  journal    = {CoRR},
  volume     = {abs/1603.08023},
  year       = {2016},
  url        = {http://arxiv.org/abs/1603.08023},
  eprinttype = {arXiv},
  eprint     = {1603.08023},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LiuLSNCP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LoweSNCP16,
  author     = {Ryan Lowe and
                Iulian Vlad Serban and
                Michael Noseworthy and
                Laurent Charlin and
                Joelle Pineau},
  title      = {On the Evaluation of Dialogue Systems with Next Utterance Classification},
  journal    = {CoRR},
  volume     = {abs/1605.05414},
  year       = {2016},
  url        = {http://arxiv.org/abs/1605.05414},
  eprinttype = {arXiv},
  eprint     = {1605.05414},
  timestamp  = {Thu, 13 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LoweSNCP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanSLCPCB16,
  author     = {Iulian Vlad Serban and
                Alessandro Sordoni and
                Ryan Lowe and
                Laurent Charlin and
                Joelle Pineau and
                Aaron C. Courville and
                Yoshua Bengio},
  title      = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating Dialogues},
  journal    = {CoRR},
  volume     = {abs/1605.06069},
  year       = {2016},
  url        = {http://arxiv.org/abs/1605.06069},
  eprinttype = {arXiv},
  eprint     = {1605.06069},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SerbanSLCPCB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BahdanauBXGLPCB16,
  author     = {Dzmitry Bahdanau and
                Philemon Brakel and
                Kelvin Xu and
                Anirudh Goyal and
                Ryan Lowe and
                Joelle Pineau and
                Aaron C. Courville and
                Yoshua Bengio},
  title      = {An Actor-Critic Algorithm for Sequence Prediction},
  journal    = {CoRR},
  volume     = {abs/1607.07086},
  year       = {2016},
  url        = {http://arxiv.org/abs/1607.07086},
  eprinttype = {arXiv},
  eprint     = {1607.07086},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BahdanauBXGLPCB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ThodoroffPL16,
  author     = {Pierre Thodoroff and
                Joelle Pineau and
                Andrew Lim},
  title      = {Learning Robust Features using Deep Learning for Automatic Seizure Detection},
  journal    = {CoRR},
  volume     = {abs/1608.00220},
  year       = {2016},
  url        = {http://arxiv.org/abs/1608.00220},
  eprinttype = {arXiv},
  eprint     = {1608.00220},
  timestamp  = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ThodoroffPL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GhavamzadehMPT16,
  author     = {Mohammad Ghavamzadeh and
                Shie Mannor and
                Joelle Pineau and
                Aviv Tamar},
  title      = {Bayesian Reinforcement Learning: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/1609.04436},
  year       = {2016},
  url        = {http://arxiv.org/abs/1609.04436},
  eprinttype = {arXiv},
  eprint     = {1609.04436},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/GhavamzadehMPT16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanLCP16,
  author     = {Iulian Vlad Serban and
                Ryan Lowe and
                Laurent Charlin and
                Joelle Pineau},
  title      = {Generative Deep Neural Networks for Dialogue: {A} Short Review},
  journal    = {CoRR},
  volume     = {abs/1611.06216},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.06216},
  eprinttype = {arXiv},
  eprint     = {1611.06216},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SerbanLCP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Second author uses the "Last, Jr, First" form so that "II" is parsed as a generational suffix and "Ororbia" as the surname.
@article{DBLP:journals/corr/SerbanOPC16,
  author     = {Iulian Vlad Serban and
                Ororbia, II, Alexander G. and
                Joelle Pineau and
                Aaron C. Courville},
  title      = {Multi-modal Variational Encoder-Decoders},
  journal    = {CoRR},
  volume     = {abs/1612.00377},
  year       = {2016},
  url        = {http://arxiv.org/abs/1612.00377},
  eprinttype = {arXiv},
  eprint     = {1612.00377},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SerbanOPC16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ftml/GhavamzadehMPT15,
  author    = {Mohammad Ghavamzadeh and
               Shie Mannor and
               Joelle Pineau and
               Aviv Tamar},
  title     = {Bayesian Reinforcement Learning: {A} Survey},
  journal   = {Found. Trends Mach. Learn.},
  volume    = {8},
  number    = {5-6},
  pages     = {359--483},
  year      = {2015},
  url       = {https://doi.org/10.1561/2200000049},
  doi       = {10.1561/2200000049},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ftml/GhavamzadehMPT15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WangP15,
  author    = {Boyu Wang and
               Joelle Pineau},
  editor    = {Blai Bonet and
               Sven Koenig},
  title     = {Online Boosting Algorithms for Anytime Transfer and Multitask Learning},
  booktitle = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages     = {3038--3044},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {https://doi.org/10.1609/aaai.v29i1.9607},
  doi       = {10.1609/AAAI.V29I1.9607},
  timestamp = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WangP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the acronym POMDPs is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/aaai/MaP15,
  author    = {Hang Ma and
               Joelle Pineau},
  editor    = {Blai Bonet and
               Sven Koenig},
  title     = {Information Gathering and Reward Exploitation of Subgoals for {POMDPs}},
  booktitle = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages     = {3320--3326},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {https://doi.org/10.1609/aaai.v29i1.9659},
  doi       = {10.1609/AAAI.V29I1.9659},
  timestamp = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/MaP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the proper adjective Gaussian is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/aaaifs/DurandP15,
  author    = {Audrey Durand and
               Joelle Pineau},
  title     = {Adaptive Treatment Allocation Using Sub-Sampled {Gaussian} Processes},
  booktitle = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14, 2015},
  pages     = {9--11},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11671},
  timestamp = {Wed, 14 Nov 2018 16:20:12 +0100},
  biburl    = {https://dblp.org/rec/conf/aaaifs/DurandP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/SutcliffeTP15,
  author    = {Andrew Sutcliffe and
               Neil A. Tenenholtz and
               Joelle Pineau},
  title     = {Missteps in Robot Social Navigation},
  booktitle = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14, 2015},
  pages     = {134--136},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11679},
  timestamp = {Sun, 09 Jun 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaaifs/SutcliffeTP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/Pineau15,
  author    = {Joelle Pineau},
  editor    = {Ronen I. Brafman and
               Carmel Domshlak and
               Patrik Haslum and
               Shlomo Zilberstein},
  title     = {Improving the Design and Discovery of Dynamic Treatment Strategies Using Recent Results in Sequential Decision-Making},
  booktitle = {Proceedings of the Twenty-Fifth International Conference on Automated Planning and Scheduling, {ICAPS} 2015, Jerusalem, Israel, June 7-11, 2015},
  pages     = {373},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {http://www.aaai.org/ocs/index.php/ICAPS/ICAPS15/paper/view/10637},
  timestamp = {Tue, 26 May 2015 21:03:02 +0200},
  biburl    = {https://dblp.org/rec/conf/aips/Pineau15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the place name Montreal is brace-protected against sentence-casing styles.
% Booktitle: braces now wrap only the acronym ICML instead of straddling the opening parenthesis.
@inproceedings{DBLP:conf/icml/PineauB15,
  author    = {Joelle Pineau and
               Pierre{-}Luc Bacon},
  editor    = {Ioannis Katakis and
               Fran{\c{c}}ois Schnitzler and
               Thomas Liebig and
               Dimitrios Gunopulos and
               Katharina Morik and
               Gennady L. Andrienko and
               Shie Mannor},
  title     = {Analyzing Open Data from the City of {Montreal}},
  booktitle = {Proceedings of the 2nd International Workshop on Mining Urban Data co-located with 32nd International Conference on Machine Learning ({ICML} 2015), Lille, France, July 11th, 2015},
  series    = {{CEUR} Workshop Proceedings},
  volume    = {1392},
  pages     = {11--16},
  publisher = {CEUR-WS.org},
  year      = {2015},
  url       = {https://ceur-ws.org/Vol-1392/paper-02.pdf},
  timestamp = {Fri, 10 Mar 2023 16:22:13 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/PineauB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: 2D is brace-protected so sentence-casing styles do not render it as "2d".
@inproceedings{DBLP:conf/icra/LeighPOZ15,
  author    = {Angus Leigh and
               Joelle Pineau and
               Nicolas A. Olmedo and
               Hong Zhang},
  title     = {Person tracking and following with {2D} laser scanners},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2015, Seattle, WA, USA, 26-30 May, 2015},
  pages     = {726--733},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/ICRA.2015.7139259},
  doi       = {10.1109/ICRA.2015.7139259},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/LeighPOZ15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/BarretoBPP15,
  author    = {Andr{\'{e}} da Motta Salles Barreto and
               Rafael L. Beirigo and
               Joelle Pineau and
               Doina Precup},
  editor    = {Qiang Yang and
               Michael J. Wooldridge},
  title     = {An Expectation-Maximization Algorithm to Compute a Stochastic Factorization From Data},
  booktitle = {Proceedings of the Twenty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July 25-31, 2015},
  pages     = {3329--3336},
  publisher = {{AAAI} Press},
  year      = {2015},
  url       = {http://ijcai.org/Abstract/15/469},
  timestamp = {Tue, 20 Aug 2019 16:16:43 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/BarretoBPP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/YuenPA15,
  author    = {HiuKim Yuen and
               Joelle Pineau and
               Philippe S. Archambault},
  title     = {Automatically characterizing driving activities onboard smart wheelchairs from accelerometer data},
  booktitle = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2015, Hamburg, Germany, September 28 - October 2, 2015},
  pages     = {5011--5018},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/IROS.2015.7354082},
  doi       = {10.1109/IROS.2015.7354082},
  timestamp = {Fri, 26 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/YuenPA15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Publisher corrected from "Computer Linguistics" to the organisation's actual name, "Computational Linguistics".
% Title: the product name Ubuntu is brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/sigdial/LowePSP15,
  author    = {Ryan Lowe and
               Nissan Pow and
               Iulian Serban and
               Joelle Pineau},
  title     = {The {Ubuntu} Dialogue Corpus: {A} Large Dataset for Research in Unstructured Multi-Turn Dialogue Systems},
  booktitle = {Proceedings of the {SIGDIAL} 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic},
  pages     = {285--294},
  publisher = {The Association for Computational Linguistics},
  year      = {2015},
  url       = {https://doi.org/10.18653/v1/w15-4640},
  doi       = {10.18653/V1/W15-4640},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sigdial/LowePSP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the product name Ubuntu is brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/LowePSP15,
  author     = {Ryan Lowe and
                Nissan Pow and
                Iulian Serban and
                Joelle Pineau},
  title      = {The {Ubuntu} Dialogue Corpus: {A} Large Dataset for Research in Unstructured Multi-Turn Dialogue Systems},
  journal    = {CoRR},
  volume     = {abs/1506.08909},
  year       = {2015},
  url        = {http://arxiv.org/abs/1506.08909},
  eprinttype = {arXiv},
  eprint     = {1506.08909},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LowePSP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanSBCP15,
  author     = {Iulian Vlad Serban and
                Alessandro Sordoni and
                Yoshua Bengio and
                Aaron C. Courville and
                Joelle Pineau},
  title      = {Hierarchical Neural Network Generative Models for Movie Dialogues},
  journal    = {CoRR},
  volume     = {abs/1507.04808},
  year       = {2015},
  url        = {http://arxiv.org/abs/1507.04808},
  eprinttype = {arXiv},
  eprint     = {1507.04808},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SerbanSBCP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioBPP15,
  author     = {Emmanuel Bengio and
                Pierre{-}Luc Bacon and
                Joelle Pineau and
                Doina Precup},
  title      = {Conditional Computation in Neural Networks for faster models},
  journal    = {CoRR},
  volume     = {abs/1511.06297},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.06297},
  eprinttype = {arXiv},
  eprint     = {1511.06297},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/BengioBPP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanLCP15,
  author     = {Iulian Vlad Serban and
                Ryan Lowe and
                Peter Henderson and
                Laurent Charlin and
                Joelle Pineau},
  title      = {A Survey of Available Corpora for Building Data-Driven Dialogue Systems},
  journal    = {CoRR},
  volume     = {abs/1512.05742},
  year       = {2015},
  url        = {http://arxiv.org/abs/1512.05742},
  eprinttype = {arXiv},
  eprint     = {1512.05742},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SerbanLCP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/BarretoPP14,
  author    = {Andr{\'{e}} da Motta Salles Barreto and
               Joelle Pineau and
               Doina Precup},
  title     = {Policy Iteration Based on Stochastic Factorization},
  journal   = {J. Artif. Intell. Res.},
  volume    = {50},
  pages     = {763--803},
  year      = {2014},
  url       = {https://doi.org/10.1613/jair.4301},
  doi       = {10.1613/JAIR.4301},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jair/BarretoPP14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/HamiltonFP14,
  author    = {William L. Hamilton and
               Mahdi Milani Fard and
               Joelle Pineau},
  title     = {Efficient learning and planning with compressed predictive states},
  journal   = {J. Mach. Learn. Res.},
  volume    = {15},
  number    = {1},
  pages     = {3395--3439},
  year      = {2014},
  url       = {https://dl.acm.org/doi/10.5555/2627435.2750354},
  doi       = {10.5555/2627435.2750354},
  timestamp = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/HamiltonFP14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/SutcliffeGP14,
  author    = {Andrew Sutcliffe and
               Daniel H. Grollman and
               Joelle Pineau},
  title     = {Estimating People's Subjective Experiences of Robot Behavior},
  booktitle = {2014 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 13-15, 2014},
  publisher = {{AAAI} Press},
  year      = {2014},
  url       = {http://www.aaai.org/ocs/index.php/FSS/FSS14/paper/view/9148},
  timestamp = {Wed, 14 Nov 2018 17:08:03 +0100},
  biburl    = {https://dblp.org/rec/conf/aaaifs/SutcliffeGP14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Booktitle: ordinal typo "31th" corrected to "31st".
@inproceedings{DBLP:conf/icml/BalleHP14,
  author    = {Borja Balle and
               William L. Hamilton and
               Joelle Pineau},
  title     = {Methods of Moments for Learning Stochastic Languages: Unified Presentation and Empirical Comparison},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning, {ICML} 2014, Beijing, China, 21-26 June 2014},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {32},
  pages     = {1386--1394},
  publisher = {JMLR.org},
  year      = {2014},
  url       = {http://proceedings.mlr.press/v32/balle14.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/BalleHP14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/AlsharifP13,
  author    = {Ouais Alsharif and
               Joelle Pineau},
  editor    = {Yoshua Bengio and
               Yann LeCun},
  title     = {End-to-End Text Recognition with Hybrid {HMM} Maxout Models},
  booktitle = {2nd International Conference on Learning Representations, {ICLR} 2014, Banff, AB, Canada, April 14-16, 2014, Workshop Track Proceedings},
  year      = {2014},
  url       = {http://arxiv.org/abs/1310.1811},
  timestamp = {Thu, 04 Apr 2019 13:20:06 +0200},
  biburl    = {https://dblp.org/rec/journals/corr/AlsharifP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the acronym POMDPs is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/RossPPC14,
  author     = {St{\'{e}}phane Ross and
                Joelle Pineau and
                S{\'{e}}bastien Paquet and
                Brahim Chaib{-}draa},
  title      = {Online Planning Algorithms for {POMDPs}},
  journal    = {CoRR},
  volume     = {abs/1401.3436},
  year       = {2014},
  url        = {http://arxiv.org/abs/1401.3436},
  eprinttype = {arXiv},
  eprint     = {1401.3436},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RossPPC14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title: the proper adjective Markovian is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/FardP14,
  author     = {Mahdi Milani Fard and
                Joelle Pineau},
  title      = {Non-Deterministic Policies in {Markovian} Decision Processes},
  journal    = {CoRR},
  volume     = {abs/1401.3871},
  year       = {2014},
  url        = {http://arxiv.org/abs/1401.3871},
  eprinttype = {arXiv},
  eprint     = {1401.3871},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/FardP14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AlsharifBP14,
  author     = {Ouais Alsharif and
                Philip Bachman and
                Joelle Pineau},
  title      = {Lifelong Learning of Discriminative Representations},
  journal    = {CoRR},
  volume     = {abs/1404.4108},
  year       = {2014},
  url        = {http://arxiv.org/abs/1404.4108},
  eprinttype = {arXiv},
  eprint     = {1404.4108},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/AlsharifBP14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BarretoPP14,
  author     = {Andr{\'{e}} da Motta Salles Barreto and
                Doina Precup and
                Joelle Pineau},
  title      = {Practical Kernel-Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1407.5358},
  year       = {2014},
  url        = {http://arxiv.org/abs/1407.5358},
  eprinttype = {arXiv},
  eprint     = {1407.5358},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BarretoPP14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/ShaniPK13,
  author    = {Guy Shani and
               Joelle Pineau and
               Robert Kaplow},
  title     = {A survey of point-based {POMDP} solvers},
  journal   = {Auton. Agents Multi Agent Syst.},
  volume    = {27},
  number    = {1},
  pages     = {1--51},
  year      = {2013},
  url       = {https://doi.org/10.1007/s10458-012-9200-2},
  doi       = {10.1007/S10458-012-9200-2},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/aamas/ShaniPK13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pami/FrankMPP13,
  author    = {Jordan Frank and
               Shie Mannor and
               Joelle Pineau and
               Doina Precup},
  title     = {Time Series Analysis Using Geometric Template Matching},
  journal   = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume    = {35},
  number    = {3},
  pages     = {740--754},
  year      = {2013},
  url       = {https://doi.org/10.1109/TPAMI.2012.121},
  doi       = {10.1109/TPAMI.2012.121},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pami/FrankMPP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/OngGP13,
  author    = {Sylvie C. W. Ong and
               Yuri Grinberg and
               Joelle Pineau},
  editor    = {Marie desJardins and
               Michael L. Littman},
  title     = {Mixed Observability Predictive State Representations},
  booktitle = {Proceedings of the Twenty-Seventh {AAAI} Conference on Artificial Intelligence, July 14-18, 2013, Bellevue, Washington, {USA}},
  pages     = {746--752},
  publisher = {{AAAI} Press},
  year      = {2013},
  url       = {https://doi.org/10.1609/aaai.v27i1.8680},
  doi       = {10.1609/AAAI.V27I1.8680},
  timestamp = {Mon, 04 Sep 2023 15:56:33 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/OngGP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/Pineau13,
  author    = {Joelle Pineau},
  title     = {Designing Intelligent Wheelchairs: Reintegrating {AI}},
  booktitle = {Designing Intelligent Robots: Reintegrating {AI} II, Papers from the 2013 {AAAI} Spring Symposium, Palo Alto, California, USA, March 25-27, 2013},
  series    = {{AAAI} Technical Report},
  volume    = {{SS-13-04}},
  publisher = {{AAAI}},
  year      = {2013},
  url       = {http://www.aaai.org/ocs/index.php/SSS/SSS13/paper/view/5783},
  timestamp = {Mon, 09 Sep 2013 15:13:13 +0200},
  biburl    = {https://dblp.org/rec/conf/aaaiss/Pineau13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/HamiltonFP13,
  author    = {William L. Hamilton and
               Mahdi Milani Fard and
               Joelle Pineau},
  title     = {Modelling Sparse Dynamical Systems with Compressed Predictive State Representations},
  booktitle = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {28},
  pages     = {178--186},
  publisher = {JMLR.org},
  year      = {2013},
  url       = {http://proceedings.mlr.press/v28/hamilton13.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/HamiltonFP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/KimFPP13,
  author    = {Beomjoon Kim and
               Amir{-}massoud Farahmand and
               Joelle Pineau and
               Doina Precup},
  editor    = {Christopher J. C. Burges and
               L{\'{e}}on Bottou and
               Zoubin Ghahramani and
               Kilian Q. Weinberger},
  title     = {Learning from Limited Demonstrations},
  booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages     = {2859--2867},
  year      = {2013},
  url       = {https://proceedings.neurips.cc/paper/2013/hash/fd5c905bcd8c3348ad1b35d7231ee2b1-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/KimFPP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/FardGFPP13,
  author    = {Mahdi Milani Fard and
               Yuri Grinberg and
               Amir{-}massoud Farahmand and
               Joelle Pineau and
               Doina Precup},
  editor    = {Christopher J. C. Burges and
               L{\'{e}}on Bottou and
               Zoubin Ghahramani and
               Kilian Q. Weinberger},
  title     = {Bellman Error Based Feature Generation using Random Projections on Sparse Spaces},
  booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages     = {3030--3038},
  year      = {2013},
  url       = {https://proceedings.neurips.cc/paper/2013/hash/86e8f7ab32cfd12577bc2619bc635690-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/FardGFPP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rss/KimP13,
  author    = {Beomjoon Kim and
               Joelle Pineau},
  editor    = {Paul Newman and
               Dieter Fox and
               David Hsu},
  title     = {Maximum Mean Discrepancy Imitation Learning},
  booktitle = {Robotics: Science and Systems IX, Technische Universit{\"{a}}t Berlin, Berlin, Germany, June 24 - June 28, 2013},
  year      = {2013},
  url       = {http://www.roboticsproceedings.org/rss09/p38.html},
  doi       = {10.15607/RSS.2013.IX.038},
  timestamp = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/rss/KimP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WangP13,
  author     = {Boyu Wang and
                Joelle Pineau},
  title      = {Online Ensemble Learning for Imbalanced Data Streams},
  journal    = {CoRR},
  volume     = {abs/1310.8004},
  year       = {2013},
  url        = {http://arxiv.org/abs/1310.8004},
  eprinttype = {arXiv},
  eprint     = {1310.8004},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/WangP13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HamiltonFP13,
  author     = {William L. Hamilton and
                Mahdi Milani Fard and
                Joelle Pineau},
  title      = {Efficient Learning and Planning with Compressed Predictive States},
  journal    = {CoRR},
  volume     = {abs/1312.0286},
  year       = {2013},
  url        = {http://arxiv.org/abs/1312.0286},
  eprinttype = {arXiv},
  eprint     = {1312.0286},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HamiltonFP13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Title: the eponym Bayes and the acronym POMDPs are brace-protected against sentence-casing styles.
@article{DBLP:journals/ai/Doshi-VelezPR12,
  author    = {Finale Doshi{-}Velez and
               Joelle Pineau and
               Nicholas Roy},
  title     = {Reinforcement learning with limited reinforcement: Using {Bayes} risk for active learning in {POMDPs}},
  journal   = {Artif. Intell.},
  volume    = {187},
  pages     = {115--132},
  year      = {2012},
  url       = {https://doi.org/10.1016/j.artint.2012.04.006},
  doi       = {10.1016/J.ARTINT.2012.04.006},
  timestamp = {Sat, 27 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ai/Doshi-VelezPR12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title: the eponym Bayes and the acronym POMDPs are brace-protected against sentence-casing styles.
@article{DBLP:journals/jstsp/PngPC12,
  author    = {ShaoWei Png and
               Joelle Pineau and
               Brahim Chaib{-}draa},
  title     = {Building Adaptive Dialogue Systems Via {Bayes}-Adaptive {POMDPs}},
  journal   = {{IEEE} J. Sel. Top. Signal Process.},
  volume    = {6},
  number    = {8},
  pages     = {917--927},
  year      = {2012},
  url       = {https://doi.org/10.1109/JSTSP.2012.2229962},
  doi       = {10.1109/JSTSP.2012.2229962},
  timestamp = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jstsp/PngPC12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/FardGPP12,
  author    = {Mahdi Milani Fard and
               Yuri Grinberg and
               Joelle Pineau and
               Doina Precup},
  editor    = {J{\"{o}}rg Hoffmann and
               Bart Selman},
  title     = {Compressed Least-Squares Regression on Sparse Spaces},
  booktitle = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence, July 22-26, 2012, Toronto, Ontario, Canada},
  pages     = {1054--1060},
  publisher = {{AAAI} Press},
  year      = {2012},
  url       = {https://doi.org/10.1609/aaai.v26i1.8303},
  doi       = {10.1609/AAAI.V26I1.8303},
  timestamp = {Mon, 04 Sep 2023 15:56:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/FardGPP12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/crv/TsangOP12,
  author    = {Emily Tsang and
               Sylvie C. W. Ong and
               Joelle Pineau},
  title     = {Design and Evaluation of a Flexible Interface for Spatial Navigation},
  booktitle = {Ninth Conference on Computer and Robot Vision, {CRV} 2012, Toronto, Ontario, Canada, May 28-30, 2012},
  pages     = {353--360},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/CRV.2012.53},
  doi       = {10.1109/CRV.2012.53},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/crv/TsangOP12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EWRL 2012 workshop paper (JMLR Proceedings vol. 24).
% MDPs is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/ewrl/PaduraruPPC12,
  author     = {Cosmin Paduraru and Doina Precup and Joelle Pineau and Gheorghe Comanici},
  editor     = {Marc Peter Deisenroth and Csaba Szepesv{\'{a}}ri and Jan Peters},
  title      = {An Empirical Analysis of Off-policy Learning in Discrete {MDPs}},
  booktitle  = {Proceedings of the Tenth European Workshop on Reinforcement Learning, {EWRL} 2012, Edinburgh, Scotland, UK, June, 2012},
  series     = {{JMLR} Proceedings},
  volume     = {24},
  pages      = {89--102},
  publisher  = {JMLR.org},
  year       = {2012},
  url        = {http://proceedings.mlr.press/v24/paduraru12a.html},
  timestamp  = {Wed, 29 May 2019 08:41:44 +0200},
  biburl     = {https://dblp.org/rec/conf/ewrl/PaduraruPPC12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2012 conference paper.
% The first author is written in Last, First form: as First von Last, the
% lowercase da would be parsed as a von particle and Motta Salles Barreto as
% the surname, whereas the DBLP key indicates the surname is Barreto.
@inproceedings{DBLP:conf/nips/BarretoPP12,
  author     = {Barreto, Andr{\'{e}} da Motta Salles and Doina Precup and Joelle Pineau},
  editor     = {Peter L. Bartlett and Fernando C. N. Pereira and Christopher J. C. Burges and L{\'{e}}on Bottou and Kilian Q. Weinberger},
  title      = {On-line Reinforcement Learning Using Incremental Kernel-Based Stochastic Factorization},
  booktitle  = {Advances in Neural Information Processing Systems 25: 26th Annual Conference on Neural Information Processing Systems 2012. Proceedings of a meeting held December 3-6, 2012, Lake Tahoe, Nevada, United States},
  pages      = {1493--1501},
  year       = {2012},
  url        = {https://proceedings.neurips.cc/paper/2012/hash/1ecfb463472ec9115b10c292ef8bc986-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/BarretoPP12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1202.3714; same title and authors as DBLP:conf/uai/DengPM11.
@article{DBLP:journals/corr/abs-1202-3714,
  author     = {Kun Deng and Joelle Pineau and Susan A. Murphy},
  title      = {Active Learning for Developing Personalized Treatment},
  journal    = {CoRR},
  volume     = {abs/1202.3714},
  year       = {2012},
  url        = {http://arxiv.org/abs/1202.3714},
  eprinttype = {arXiv},
  eprint     = {1202.3714},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1202-3714.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1202.3717.
% PAC-Bayesian is brace-protected; otherwise sentence-casing styles would emit Pac-bayesian.
@article{DBLP:journals/corr/abs-1202-3717,
  author     = {Mahdi Milani Fard and Joelle Pineau and Csaba Szepesv{\'{a}}ri},
  title      = {{PAC-Bayesian} Policy Evaluation for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1202.3717},
  year       = {2012},
  url        = {http://arxiv.org/abs/1202.3717},
  eprinttype = {arXiv},
  eprint     = {1202.3717},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1202-3717.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1206.3281.
% Bayesian is brace-protected so sentence-casing styles keep the capital B.
@article{DBLP:journals/corr/abs-1206-3281,
  author     = {St{\'{e}}phane Ross and Joelle Pineau},
  title      = {Model-Based {Bayesian} Reinforcement Learning in Large Structured Domains},
  journal    = {CoRR},
  volume     = {abs/1206.3281},
  year       = {2012},
  url        = {http://arxiv.org/abs/1206.3281},
  eprinttype = {arXiv},
  eprint     = {1206.3281},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1206-3281.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1207.4676 for the ICML-12 proceedings volume.
% NOTE(review): the listed authors are presumably the volume editors -- confirm before citing.
@article{DBLP:journals/corr/abs-1207-4676,
  author     = {John Langford and Joelle Pineau},
  title      = {Proceedings of the 29th International Conference on Machine Learning {(ICML-12)}},
  journal    = {CoRR},
  volume     = {abs/1207.4676},
  year       = {2012},
  url        = {http://arxiv.org/abs/1207.4676},
  eprinttype = {arXiv},
  eprint     = {1207.4676},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1207-4676.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1207.5554.
@article{DBLP:journals/corr/abs-1207-5554,
  author     = {Mahdi Milani Fard and Yuri Grinberg and Amir Massoud Farahmand and Joelle Pineau and Doina Precup},
  title      = {Bellman Error Based Feature Generation using Random Projections on Sparse Spaces},
  journal    = {CoRR},
  volume     = {abs/1207.5554},
  year       = {2012},
  url        = {http://arxiv.org/abs/1207.5554},
  eprinttype = {arXiv},
  eprint     = {1207.5554},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1207-5554.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1212.2495.
@article{DBLP:journals/corr/abs-1212-2495,
  author     = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  title      = {Policy-contingent abstraction for robust robot control},
  journal    = {CoRR},
  volume     = {abs/1212.2495},
  year       = {2012},
  url        = {http://arxiv.org/abs/1212.2495},
  eprinttype = {arXiv},
  eprint     = {1212.2495},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1212-2495.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% J. Artif. Intell. Res. 40 (2011) journal article.
% Markovian is brace-protected so sentence-casing styles keep the capital M.
@article{DBLP:journals/jair/FardP11,
  author     = {Mahdi Milani Fard and Joelle Pineau},
  title      = {Non-Deterministic Policies in {Markovian} Decision Processes},
  journal    = {J. Artif. Intell. Res.},
  volume     = {40},
  pages      = {1--24},
  year       = {2011},
  url        = {https://doi.org/10.1613/jair.3175},
  doi        = {10.1613/JAIR.3175},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jair/FardP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% J. Mach. Learn. Res. 12 (2011) journal article.
% Bayesian and Markov are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/jmlr/RossPCK11,
  author     = {St{\'{e}}phane Ross and Joelle Pineau and Brahim Chaib{-}draa and Pierre Kreitmann},
  title      = {A {Bayesian} Approach for Learning and Planning in Partially Observable {Markov} Decision Processes},
  journal    = {J. Mach. Learn. Res.},
  volume     = {12},
  pages      = {1729--1770},
  year       = {2011},
  url        = {https://dl.acm.org/doi/10.5555/1953048.2021055},
  doi        = {10.5555/1953048.2021055},
  timestamp  = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/RossPCK11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Mach. Learn. 84(1-2), 2011 journal article.
@article{DBLP:journals/ml/ShortreedLLSPM11,
  author     = {Susan M. Shortreed and Eric B. Laber and Daniel J. Lizotte and T. Scott Stroup and Joelle Pineau and Susan A. Murphy},
  title      = {Informing sequential clinical decision-making through reinforcement learning: an empirical study},
  journal    = {Mach. Learn.},
  volume     = {84},
  number     = {1-2},
  pages      = {109--136},
  year       = {2011},
  url        = {https://doi.org/10.1007/s10994-010-5229-0},
  doi        = {10.1007/S10994-010-5229-0},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ml/ShortreedLLSPM11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Neural Networks 24(6), 2011 journal article.
@article{DBLP:journals/nn/VincentCP11,
  author     = {Robert D. Vincent and Aaron C. Courville and Joelle Pineau},
  title      = {A bistable computational model of recurring epileptiform activity as observed in rodent slice preparations},
  journal    = {Neural Networks},
  volume     = {24},
  number     = {6},
  pages      = {526--537},
  year       = {2011},
  url        = {https://doi.org/10.1016/j.neunet.2011.03.003},
  doi        = {10.1016/J.NEUNET.2011.03.003},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nn/VincentCP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% 2011 AAAI Spring Symposium paper (Technical Report SS-11-04); no pages recorded.
@inproceedings{DBLP:conf/aaaiss/SaulnierP11,
  author     = {Guillaume Saulnier and Joelle Pineau},
  title      = {Automatic Seizure Detection in an In-Vivo Model of Epilepsy},
  booktitle  = {Computational Physiology, Papers from the 2011 {AAAI} Spring Symposium, Technical Report SS-11-04, Stanford, California, USA, March 21-23, 2011},
  publisher  = {{AAAI}},
  year       = {2011},
  url        = {http://www.aaai.org/ocs/index.php/SSS/SSS11/paper/view/2468},
  timestamp  = {Mon, 13 Feb 2012 17:06:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/SaulnierP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ADPRL 2011 conference paper.
@inproceedings{DBLP:conf/adprl/DengPM11,
  author     = {Kun Deng and Joelle Pineau and Susan A. Murphy},
  title      = {Active learning for personalizing treatment},
  booktitle  = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages      = {32--39},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ADPRL.2011.5967348},
  doi        = {10.1109/ADPRL.2011.5967348},
  timestamp  = {Wed, 16 Oct 2019 14:14:48 +0200},
  biburl     = {https://dblp.org/rec/conf/adprl/DengPM11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMBC 2011 conference paper.
@inproceedings{DBLP:conf/embc/MoghaddamPFARAP11,
  author     = {Athena K. Moghaddam and Joelle Pineau and Jordan Frank and Philippe S. Archambault and Fran{\c{c}}ois Routhier and Therese Audet and Jan Polgar and Fran{\c{c}}ois Michaud and Patrick Boissy},
  title      = {Mobility profile and wheelchair driving skills of powered wheelchair users: Sensor-based event recognition using a support vector machine classifier},
  booktitle  = {33rd Annual International Conference of the {IEEE} Engineering in Medicine and Biology Society, {EMBC} 2011, Boston, MA, USA, August 30 - Sept. 3, 2011},
  pages      = {7336--7339},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/IEMBS.2011.6091711},
  doi        = {10.1109/IEMBS.2011.6091711},
  timestamp  = {Fri, 26 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/embc/MoghaddamPFARAP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EWRL 2011 paper, published in LNCS 7188.
@inproceedings{DBLP:conf/ewrl/OngGP11,
  author     = {Sylvie C. W. Ong and Yuri Grinberg and Joelle Pineau},
  editor     = {Scott Sanner and Marcus Hutter},
  title      = {Goal-Directed Online Learning of Predictive Models},
  booktitle  = {Recent Advances in Reinforcement Learning - 9th European Workshop, {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {7188},
  pages      = {18--29},
  publisher  = {Springer},
  year       = {2011},
  url        = {https://doi.org/10.1007/978-3-642-29946-9\_6},
  doi        = {10.1007/978-3-642-29946-9\_6},
  timestamp  = {Tue, 14 May 2019 10:00:48 +0200},
  biburl     = {https://dblp.org/rec/conf/ewrl/OngGP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EWRL 2011 paper, published in LNCS 7188.
@inproceedings{DBLP:conf/ewrl/PaduraruPP11,
  author     = {Cosmin Paduraru and Doina Precup and Joelle Pineau},
  editor     = {Scott Sanner and Marcus Hutter},
  title      = {A Framework for Computing Bounds for the Return of a Policy},
  booktitle  = {Recent Advances in Reinforcement Learning - 9th European Workshop, {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {7188},
  pages      = {201--212},
  publisher  = {Springer},
  year       = {2011},
  url        = {https://doi.org/10.1007/978-3-642-29946-9\_21},
  doi        = {10.1007/978-3-642-29946-9\_21},
  timestamp  = {Tue, 23 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ewrl/PaduraruPP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2011 conference paper.
% POMDP is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/icassp/PngP11,
  author     = {ShaoWei Png and Joelle Pineau},
  title      = {Bayesian reinforcement learning for {POMDP}-based dialogue systems},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress Center, Prague, Czech Republic},
  pages      = {2156--2159},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ICASSP.2011.5946754},
  doi        = {10.1109/ICASSP.2011.5946754},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/PngP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2011 conference paper.
% The first author is written in Last, First form: as First von Last, the
% lowercase da would be parsed as a von particle and Motta Salles Barreto as
% the surname, whereas the DBLP key indicates the surname is Barreto.
@inproceedings{DBLP:conf/nips/BarretoPP11,
  author     = {Barreto, Andr{\'{e}} da Motta Salles and Doina Precup and Joelle Pineau},
  editor     = {John Shawe{-}Taylor and Richard S. Zemel and Peter L. Bartlett and Fernando C. N. Pereira and Kilian Q. Weinberger},
  title      = {Reinforcement Learning using Kernel-Based Stochastic Factorization},
  booktitle  = {Advances in Neural Information Processing Systems 24: 25th Annual Conference on Neural Information Processing Systems 2011. Proceedings of a meeting held 12-14 December 2011, Granada, Spain},
  pages      = {720--728},
  year       = {2011},
  url        = {https://proceedings.neurips.cc/paper/2011/hash/b534ba68236ba543ae44b22bd110a1d6-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/BarretoPP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% TbiLLC 2011 paper, published in LNCS 7758.
@inproceedings{DBLP:conf/tbillc/DinculescuHPPP11,
  author     = {Monica Dinculescu and Christopher Hundt and Prakash Panangaden and Joelle Pineau and Doina Precup},
  editor     = {Guram Bezhanishvili and Sebastian L{\"{o}}bner and Vincenzo Marra and Frank Richter},
  title      = {The Duality of State and Observation in Probabilistic Transition Systems},
  booktitle  = {Logic, Language, and Computation - 9th International Tbilisi Symposium on Logic, Language, and Computation, TbiLLC 2011, Kutaisi, Georgia, September 26-30, 2011, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {7758},
  pages      = {206--230},
  publisher  = {Springer},
  year       = {2011},
  url        = {https://doi.org/10.1007/978-3-642-36976-6\_14},
  doi        = {10.1007/978-3-642-36976-6\_14},
  timestamp  = {Tue, 14 May 2019 10:00:54 +0200},
  biburl     = {https://dblp.org/rec/conf/tbillc/DinculescuHPPP11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2011 conference paper.
% The url query separators are plain escaped ampersands; the export had each one
% followed by a stray HTML entity for the ampersand, which cut the query off at
% the hash sign.
@inproceedings{DBLP:conf/uai/DengPM11,
  author     = {Kun Deng and Joelle Pineau and Susan A. Murphy},
  editor     = {F{\'{a}}bio Gagliardi Cozman and Avi Pfeffer},
  title      = {Active Learning for Developing Personalized Treatment},
  booktitle  = {{UAI} 2011, Proceedings of the Twenty-Seventh Conference on Uncertainty in Artificial Intelligence, Barcelona, Spain, July 14-17, 2011},
  pages      = {161--168},
  publisher  = {{AUAI} Press},
  year       = {2011},
  url        = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=2196\&proceeding\_id=27},
  timestamp  = {Wed, 03 Feb 2021 11:09:03 +0100},
  biburl     = {https://dblp.org/rec/conf/uai/DengPM11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2011 conference paper.
% PAC-Bayesian is brace-protected; otherwise sentence-casing styles would emit Pac-bayesian.
% The url query separators are plain escaped ampersands; the export had each one
% followed by a stray HTML entity for the ampersand, which cut the query off at
% the hash sign.
@inproceedings{DBLP:conf/uai/FardPS11,
  author     = {Mahdi Milani Fard and Joelle Pineau and Csaba Szepesv{\'{a}}ri},
  editor     = {F{\'{a}}bio Gagliardi Cozman and Avi Pfeffer},
  title      = {{PAC-Bayesian} Policy Evaluation for Reinforcement Learning},
  booktitle  = {{UAI} 2011, Proceedings of the Twenty-Seventh Conference on Uncertainty in Artificial Intelligence, Barcelona, Spain, July 14-17, 2011},
  pages      = {195--202},
  publisher  = {{AUAI} Press},
  year       = {2011},
  url        = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=2218\&proceeding\_id=27},
  timestamp  = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/uai/FardPS11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv (CoRR) record 1110.0027.
% POMDPs is brace-protected so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-1110-0027,
  author     = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  title      = {Anytime Point-Based Approximations for Large {POMDPs}},
  journal    = {CoRR},
  volume     = {abs/1110.0027},
  year       = {2011},
  url        = {http://arxiv.org/abs/1110.0027},
  eprinttype = {arXiv},
  eprint     = {1110.0027},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1110-0027.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% 2010 AAAI Fall Symposium paper (AAAI Technical Report FS-10-06); no pages recorded.
@inproceedings{DBLP:conf/aaaifs/BushP10,
  author     = {Keith Bush and Joelle Pineau},
  title      = {Treating Epilepsy by Reinforcement Learning Via Manifold-Based Simulation},
  booktitle  = {Manifold Learning and Its Applications, Papers from the 2010 {AAAI} Fall Symposium, Arlington, Virginia, USA, November 11-13, 2010},
  series     = {{AAAI} Technical Report},
  volume     = {{FS-10-06}},
  publisher  = {{AAAI}},
  year       = {2010},
  url        = {http://www.aaai.org/ocs/index.php/FSS/FSS10/paper/view/2263},
  timestamp  = {Thu, 26 Sep 2013 15:55:57 +0200},
  biburl     = {https://dblp.org/rec/conf/aaaifs/BushP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CIKM 2010 conference paper.
@inproceedings{DBLP:conf/cikm/WestPP10,
  author     = {Robert West and Doina Precup and Joelle Pineau},
  editor     = {Jimmy X. Huang and Nick Koudas and Gareth J. F. Jones and Xindong Wu and Kevyn Collins{-}Thompson and Aijun An},
  title      = {Automatically suggesting topics for augmenting text documents},
  booktitle  = {Proceedings of the 19th {ACM} Conference on Information and Knowledge Management, {CIKM} 2010, Toronto, Ontario, Canada, October 26-30, 2010},
  pages      = {929--938},
  publisher  = {{ACM}},
  year       = {2010},
  url        = {https://doi.org/10.1145/1871437.1871556},
  doi        = {10.1145/1871437.1871556},
  timestamp  = {Wed, 03 Aug 2022 15:48:33 +0200},
  biburl     = {https://dblp.org/rec/conf/cikm/WestPP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2010 conference paper.
@inproceedings{DBLP:conf/icra/KaplowAP10,
  author     = {Robert Kaplow and Amin Atrash and Joelle Pineau},
  title      = {Variable resolution decomposition for robotic navigation under a {POMDP} framework},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages      = {369--376},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/ROBOT.2010.5509188},
  doi        = {10.1109/ROBOT.2010.5509188},
  timestamp  = {Mon, 22 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/KaplowAP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2010 conference paper.
@inproceedings{DBLP:conf/icra/GuezP10,
  author     = {Arthur Guez and Joelle Pineau},
  title      = {Multi-tasking {SLAM}},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages      = {377--384},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/ROBOT.2010.5509969},
  doi        = {10.1109/ROBOT.2010.5509969},
  timestamp  = {Mon, 22 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/GuezP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2010 conference paper.
% PAC-Bayesian is brace-protected; otherwise sentence-casing styles would emit Pac-bayesian.
@inproceedings{DBLP:conf/nips/FardP10,
  author     = {Mahdi Milani Fard and Joelle Pineau},
  editor     = {John D. Lafferty and Christopher K. I. Williams and John Shawe{-}Taylor and Richard S. Zemel and Aron Culotta},
  title      = {{PAC-Bayesian} Model Selection for Reinforcement Learning},
  booktitle  = {Advances in Neural Information Processing Systems 23: 24th Annual Conference on Neural Information Processing Systems 2010. Proceedings of a meeting held 6-9 December 2010, Vancouver, British Columbia, Canada},
  pages      = {1624--1632},
  publisher  = {Curran Associates, Inc.},
  year       = {2010},
  url        = {https://proceedings.neurips.cc/paper/2010/hash/66368270ffd51418ec58bd793f2d9b1b-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/FardP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% PerMIS 2010 workshop paper.
@inproceedings{DBLP:conf/permis/Pineau0AVR10,
  author     = {Joelle Pineau and Robert West and Amin Atrash and Julien Villemure and Fran{\c{c}}ois Routhier},
  editor     = {Elena Messina and Raj Madhavan},
  title      = {Towards a standardized test for intelligent wheelchairs},
  booktitle  = {Proceedings of the 10th Performance Metrics for Intelligent Systems Workshop, PerMIS 2010, Baltimore, Maryland, USA, September 28-30, 2010},
  pages      = {169--174},
  publisher  = {{ACM}},
  year       = {2010},
  url        = {https://doi.org/10.1145/2377576.2377607},
  doi        = {10.1145/2377576.2377607},
  timestamp  = {Wed, 04 Nov 2020 08:42:47 +0100},
  biburl     = {https://dblp.org/rec/conf/permis/Pineau0AVR10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AI Mag. 30(1), 2009: multi-author workshop report.
@article{DBLP:journals/aim/BunescuCCCCDDDFGGGHJJKKKLLMMMMPPRRSSSATWSWZ09,
  author     = {Razvan C. Bunescu and Vitor R. Carvalho and Jan Chomicki and Vincent Conitzer and Michael T. Cox and Virginia Dignum and Zachary Dodds and Mark Dredze and David Furcy and Evgeniy Gabrilovich and Mehmet H. G{\"{o}}ker and Hans W. Guesgen and Haym Hirsh and Dietmar Jannach and Ulrich Junker and Wolfgang Ketter and Alfred Kobsa and Sven Koenig and Tessa A. Lau and Lundy Lewis and Eric T. Matson and Ted Metzler and Rada Mihalcea and Bamshad Mobasher and Joelle Pineau and Pascal Poupart and Anita Raja and Wheeler Ruml and Norman M. Sadeh and Guy Shani and Daniel G. Shapiro and Sarabjot Singh Anand and Matthew E. Taylor and Kiri Wagstaff and Trey Smith and William E. Walsh and Rong Zhou},
  title      = {{AAAI} 2008 Workshop Reports},
  journal    = {{AI} Mag.},
  volume     = {30},
  number     = {1},
  pages      = {108--118},
  year       = {2009},
  url        = {https://doi.org/10.1609/aimag.v30i1.2196},
  doi        = {10.1609/AIMAG.V30I1.2196},
  timestamp  = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/aim/BunescuCCCCDDDFGGGHJJKKKLLMMMMPPRRSSSATWSWZ09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Int. J. Neural Syst. 19(4), 2009 journal article.
@article{DBLP:journals/ijns/PineauGVPA09,
  author     = {Joelle Pineau and Arthur Guez and Robert D. Vincent and Gabriella Panuccio and Massimo Avoli},
  title      = {Treating Epilepsy via Adaptive Neurostimulation: a Reinforcement Learning Approach},
  journal    = {Int. J. Neural Syst.},
  volume     = {19},
  number     = {4},
  pages      = {227--240},
  year       = {2009},
  url        = {https://doi.org/10.1142/S0129065709001987},
  doi        = {10.1142/S0129065709001987},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ijns/PineauGVPA09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Int. J. Soc. Robotics 1(4), 2009 journal article.
@article{DBLP:journals/ijsr/AtrashKVWYP09,
  author     = {Amin Atrash and Robert Kaplow and Julien Villemure and Robert West and Hiba Yamani and Joelle Pineau},
  title      = {Development and Validation of a Robust Speech Interface for Improved Human-Robot Interaction},
  journal    = {Int. J. Soc. Robotics},
  volume     = {1},
  number     = {4},
  pages      = {345--356},
  year       = {2009},
  url        = {https://doi.org/10.1007/s12369-009-0032-4},
  doi        = {10.1007/S12369-009-0032-4},
  timestamp  = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijsr/AtrashKVWYP09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CIKM 2009 conference paper.
% Wikipedia is capitalised and brace-protected as a proper noun; the export stored it in lowercase.
@inproceedings{DBLP:conf/cikm/WestPP09,
  author     = {Robert West and Doina Precup and Joelle Pineau},
  editor     = {David Wai{-}Lok Cheung and Il{-}Yeol Song and Wesley W. Chu and Xiaohua Hu and Jimmy Lin},
  title      = {Completing {Wikipedia}'s hyperlink structure through dimensionality reduction},
  booktitle  = {Proceedings of the 18th {ACM} Conference on Information and Knowledge Management, {CIKM} 2009, Hong Kong, China, November 2-6, 2009},
  pages      = {1097--1106},
  publisher  = {{ACM}},
  year       = {2009},
  url        = {https://doi.org/10.1145/1645953.1646093},
  doi        = {10.1145/1645953.1646093},
  timestamp  = {Fri, 27 Aug 2021 11:13:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cikm/WestPP09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2009 conference paper.
@inproceedings{DBLP:conf/ijcai/WestPP09,
  author     = {Robert West and Joelle Pineau and Doina Precup},
  editor     = {Craig Boutilier},
  title      = {Wikispeedia: An Online Game for Inferring Semantic Distances between Concepts},
  booktitle  = {{IJCAI} 2009, Proceedings of the 21st International Joint Conference on Artificial Intelligence, Pasadena, California, USA, July 11-17, 2009},
  pages      = {1598--1603},
  year       = {2009},
  url        = {http://ijcai.org/Proceedings/09/Papers/267.pdf},
  timestamp  = {Tue, 20 Aug 2019 16:16:40 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/WestPP09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IUI 2009 conference paper.
% Bayesian is capitalised and brace-protected as a proper adjective; the export stored it in lowercase.
@inproceedings{DBLP:conf/iui/AtrashP09,
  author     = {Amin Atrash and Joelle Pineau},
  editor     = {Cristina Conati and Mathias Bauer and Nuria Oliver and Daniel S. Weld},
  title      = {A {Bayesian} reinforcement learning approach for customizing human-robot interfaces},
  booktitle  = {Proceedings of the 14th International Conference on Intelligent User Interfaces, {IUI} 2009, Sanibel Island, Florida, USA, February 8-11, 2009},
  pages      = {355--360},
  publisher  = {{ACM}},
  year       = {2009},
  url        = {https://doi.org/10.1145/1502650.1502700},
  doi        = {10.1145/1502650.1502700},
  timestamp  = {Tue, 06 Nov 2018 11:07:41 +0100},
  biburl     = {https://dblp.org/rec/conf/iui/AtrashP09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2009 conference paper.
@inproceedings{DBLP:conf/nips/BushP09,
  author     = {Keith Bush and Joelle Pineau},
  editor     = {Yoshua Bengio and Dale Schuurmans and John D. Lafferty and Christopher K. I. Williams and Aron Culotta},
  title      = {Manifold Embeddings for Model-Based Reinforcement Learning under Partial Observability},
  booktitle  = {Advances in Neural Information Processing Systems 22: 23rd Annual Conference on Neural Information Processing Systems 2009. Proceedings of a meeting held 7-10 December 2009, Vancouver, British Columbia, Canada},
  pages      = {189--197},
  publisher  = {Curran Associates, Inc.},
  year       = {2009},
  url        = {https://proceedings.neurips.cc/paper/2009/hash/a2557a7b2e94197ff767970b67041697-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/BushP09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% J. Artif. Intell. Res. 32 (2008) journal article.
% POMDPs is brace-protected so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/jair/RossPPC08,
  author     = {St{\'{e}}phane Ross and Joelle Pineau and S{\'{e}}bastien Paquet and Brahim Chaib{-}draa},
  title      = {Online Planning Algorithms for {POMDPs}},
  journal    = {J. Artif. Intell. Res.},
  volume     = {32},
  pages      = {663--704},
  year       = {2008},
  url        = {https://doi.org/10.1613/jair.2567},
  doi        = {10.1613/JAIR.2567},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/RossPPC08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2008 conference paper.
@inproceedings{DBLP:conf/aaai/FardPS08,
  author     = {Mahdi Milani Fard and Joelle Pineau and Peng Sun},
  editor     = {Dieter Fox and Carla P. Gomes},
  title      = {A Variance Analysis for {POMDP} Policy Evaluation},
  booktitle  = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2008, Chicago, Illinois, USA, July 13-17, 2008},
  pages      = {1056--1061},
  publisher  = {{AAAI} Press},
  year       = {2008},
  url        = {http://www.aaai.org/Library/AAAI/2008/aaai08-167.php},
  timestamp  = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/FardPS08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2008 proceedings paper.
% NOTE(review): the url path points at the IAAI library section (iaai08-008) while
% the booktitle names the AAAI conference -- presumably the IAAI track; confirm.
@inproceedings{DBLP:conf/aaai/GuezVAP08,
  author     = {Arthur Guez and Robert D. Vincent and Massimo Avoli and Joelle Pineau},
  editor     = {Dieter Fox and Carla P. Gomes},
  title      = {Adaptive Treatment of Epilepsy via Batch-mode Reinforcement Learning},
  booktitle  = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2008, Chicago, Illinois, USA, July 13-17, 2008},
  pages      = {1671--1678},
  publisher  = {{AAAI} Press},
  year       = {2008},
  url        = {http://www.aaai.org/Library/IAAI/2008/iaai08-008.php},
  timestamp  = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/GuezVAP08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2008 conference paper.
% Bayes and POMDPs are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/icml/DoshiPR08,
  author     = {Finale Doshi and Joelle Pineau and Nicholas Roy},
  editor     = {William W. Cohen and Andrew McCallum and Sam T. Roweis},
  title      = {Reinforcement learning with limited reinforcement: using {Bayes} risk for active learning in {POMDPs}},
  booktitle  = {Machine Learning, Proceedings of the Twenty-Fifth International Conference {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series     = {{ACM} International Conference Proceeding Series},
  volume     = {307},
  pages      = {256--263},
  publisher  = {{ACM}},
  year       = {2008},
  url        = {https://doi.org/10.1145/1390156.1390189},
  doi        = {10.1145/1390156.1390189},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/DoshiPR08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2008 conference paper.
% POMDPs is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/icra/RossCP08,
  author     = {St{\'{e}}phane Ross and Brahim Chaib{-}draa and Joelle Pineau},
  title      = {Bayesian reinforcement learning in continuous {POMDPs} with application to robot navigation},
  booktitle  = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA} 2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages      = {2845--2851},
  publisher  = {{IEEE}},
  year       = {2008},
  url        = {https://doi.org/10.1109/ROBOT.2008.4543641},
  doi        = {10.1109/ROBOT.2008.4543641},
  timestamp  = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/RossCP08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ISAIM 2008 symposium paper; no pages recorded.
% Bayes and POMDPs are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/isaim/DoshiPR08,
  author     = {Finale Doshi and Joelle Pineau and Nicholas Roy},
  title      = {Reinforcement Learning with Limited Reinforcement: Using {Bayes} Risk for Active Learning in {POMDPs}},
  booktitle  = {International Symposium on Artificial Intelligence and Mathematics, {ISAIM} 2008, Fort Lauderdale, Florida, USA, January 2-4, 2008},
  year       = {2008},
  url        = {http://isaim2008.unl.edu/PAPERS/TechnicalProgram/ISAIM2008\_0044\_849d5727b40e38c8777f196c57cb519e.pdf},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/isaim/DoshiPR08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ISAIM 2008 symposium paper; no pages recorded.
% POMDPs is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/isaim/PineauRC08,
  author     = {Joelle Pineau and St{\'{e}}phane Ross and Brahim Chaib{-}draa},
  title      = {Bayes-Adaptive {POMDPs}: {A} New Perspective on the Explore-Exploit Tradeoff in Partially Observable Domains},
  booktitle  = {International Symposium on Artificial Intelligence and Mathematics, {ISAIM} 2008, Fort Lauderdale, Florida, USA, January 2-4, 2008},
  year       = {2008},
  url        = {http://isaim2008.unl.edu/PAPERS/SS3-ActiveLearning/jpineau-isaim08.pdf},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/isaim/PineauRC08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2008 conference paper.
% MDPs is brace-protected; as the first title word it would otherwise be rendered Mdps by sentence-casing styles.
@inproceedings{DBLP:conf/nips/FardP08,
  author     = {Mahdi Milani Fard and Joelle Pineau},
  editor     = {Daphne Koller and Dale Schuurmans and Yoshua Bengio and L{\'{e}}on Bottou},
  title      = {{MDPs} with Non-Deterministic Policies},
  booktitle  = {Advances in Neural Information Processing Systems 21, Proceedings of the Twenty-Second Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  pages      = {1065--1072},
  publisher  = {Curran Associates, Inc.},
  year       = {2008},
  url        = {https://proceedings.neurips.cc/paper/2008/hash/0c74b7f78409a4022a2c4c5a5ca3ee19-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/FardP08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2008 conference paper.
% Bayesian is brace-protected so sentence-casing styles keep the capital B.
% The url query separators are plain escaped ampersands; the export had each one
% followed by a stray HTML entity for the ampersand, which cut the query off at
% the hash sign.
@inproceedings{DBLP:conf/uai/RossP08,
  author     = {St{\'{e}}phane Ross and Joelle Pineau},
  editor     = {David A. McAllester and Petri Myllym{\"{a}}ki},
  title      = {Model-Based {Bayesian} Reinforcement Learning in Large Structured Domains},
  booktitle  = {{UAI} 2008, Proceedings of the 24th Conference in Uncertainty in Artificial Intelligence, Helsinki, Finland, July 9-12, 2008},
  pages      = {476--483},
  publisher  = {{AUAI} Press},
  year       = {2008},
  url        = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=1967\&proceeding\_id=24},
  timestamp  = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/uai/RossP08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Rev. d'Intelligence Artif. 21(1), 2007 journal article (French title).
% Markov is brace-protected so sentence-casing styles keep the capital M.
% NOTE(review): pages end at 34 but the DOI suffix reads 9-33 -- confirm the page
% range against the publisher record.
@article{DBLP:journals/ria/JaulmesPP07,
  author     = {Robin Jaulmes and Joelle Pineau and Doina Precup},
  title      = {Apprentissage actif dans les processus d{\'{e}}cisionnels de {Markov} partiellement observables L'algorithme {MEDUSA}},
  journal    = {Rev. d'Intelligence Artif.},
  volume     = {21},
  number     = {1},
  pages      = {9--34},
  year       = {2007},
  url        = {https://doi.org/10.3166/ria.21.9-33},
  doi        = {10.3166/RIA.21.9-33},
  timestamp  = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ria/JaulmesPP07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% 2007 AAAI Fall Symposium paper (AAAI Technical Report FS-07-03).
@inproceedings{DBLP:conf/aaaifs/HundtPPP07,
  author     = {Christopher Hundt and Prakash Panangaden and Joelle Pineau and Doina Precup},
  editor     = {Clayton T. Morrison and Tim Oates},
  title      = {Representing Systems with Hidden State},
  booktitle  = {Computational Approaches to Representation Change during Learning and Development, Papers from the 2007 {AAAI} Fall Symposium, Arlington, Virginia, USA, November 9-11, 2007},
  series     = {{AAAI} Technical Report},
  volume     = {{FS-07-03}},
  pages      = {17--23},
  publisher  = {{AAAI} Press},
  year       = {2007},
  url        = {https://www.aaai.org/Library/Symposia/Fall/2007/fs07-03-003.php},
  timestamp  = {Sun, 16 Oct 2022 14:19:55 +0200},
  biburl     = {https://dblp.org/rec/conf/aaaifs/HundtPPP07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI Spring Symposium 2007 paper (Pineau, Atrash).
% SmartWheeler is braced as a whole word so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/aaaiss/PineauA07,
  author    = {Joelle Pineau and Amin Atrash},
  title     = {{SmartWheeler}: {A} Robotic Wheelchair Test-Bed for Investigating New Models of Human-Robot Interaction},
  booktitle = {Multidisciplinary Collaboration for Socially Assistive Robotics, Papers from the 2007 {AAAI} Spring Symposium, Technical Report SS-07-07, Stanford, California, USA, March 26-28, 2007},
  pages     = {59--64},
  publisher = {{AAAI}},
  year      = {2007},
  url       = {http://www.aaai.org/Library/Symposia/Spring/2007/ss07-07-014.php},
  timestamp = {Fri, 17 Feb 2012 14:15:32 +0100},
  biburl    = {https://dblp.org/rec/conf/aaaiss/PineauA07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Canadian AI 2007 paper, published as LNCS volume 4509.
@inproceedings{DBLP:conf/ai/VincentPGA07,
  author    = {Robert D. Vincent and Joelle Pineau and Philip de Guzman and Massimo Avoli},
  editor    = {Ziad Kobti and Dan Wu},
  title     = {Recurrent Boosting for Classification of Natural and Synthetic Time-Series Data},
  booktitle = {Advances in Artificial Intelligence, 20th Conference of the Canadian Society for Computational Studies of Intelligence, Canadian {AI} 2007, Montreal, Canada, May 28-30, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4509},
  pages     = {192--203},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-72665-4\_17},
  doi       = {10.1007/978-3-540-72665-4\_17},
  timestamp = {Thu, 28 Sep 2023 12:27:08 +0200},
  biburl    = {https://dblp.org/rec/conf/ai/VincentPGA07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2007 conference paper (Jaulmes, Pineau, Precup).
@inproceedings{DBLP:conf/icra/JaulmesPP07,
  author    = {Robin Jaulmes and Joelle Pineau and Doina Precup},
  title     = {A formal framework for robot learning and control under model uncertainty},
  booktitle = {2007 {IEEE} International Conference on Robotics and Automation, {ICRA} 2007, 10-14 April 2007, Roma, Italy},
  pages     = {2104--2110},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/ROBOT.2007.363632},
  doi       = {10.1109/ROBOT.2007.363632},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/JaulmesPP07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2007 paper (Ross, Chaib-draa, Pineau).
% Bayes and the acronym POMDPs are braced so sentence-casing styles do not lowercase them.
@inproceedings{DBLP:conf/nips/RossCP07,
  author    = {St{\'{e}}phane Ross and Brahim Chaib{-}draa and Joelle Pineau},
  editor    = {John C. Platt and Daphne Koller and Yoram Singer and Sam T. Roweis},
  title     = {{Bayes}-Adaptive {POMDPs}},
  booktitle = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages     = {1225--1232},
  publisher = {Curran Associates, Inc.},
  year      = {2007},
  url       = {https://proceedings.neurips.cc/paper/2007/hash/3b3dbaf68507998acd6a5a5254ab2d76-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/RossCP07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2007 paper (Ross, Pineau, Chaib-draa).
% The acronym POMDPs is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/RossPC07,
  author    = {St{\'{e}}phane Ross and Joelle Pineau and Brahim Chaib{-}draa},
  editor    = {John C. Platt and Daphne Koller and Yoram Singer and Sam T. Roweis},
  title     = {Theoretical Analysis of Heuristic Search Methods for Online {POMDPs}},
  booktitle = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages     = {1233--1240},
  publisher = {Curran Associates, Inc.},
  year      = {2007},
  url       = {https://proceedings.neurips.cc/paper/2007/hash/138bb0696595b338afbab333c555292a-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/RossPC07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Artif. Intell. Res. 27, 2006.
% The acronym POMDPs is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/jair/PineauGT06,
  author    = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  title     = {Anytime Point-Based Approximations for Large {POMDPs}},
  journal   = {J. Artif. Intell. Res.},
  volume    = {27},
  pages     = {335--380},
  year      = {2006},
  url       = {https://doi.org/10.1613/jair.2078},
  doi       = {10.1613/JAIR.2078},
  timestamp = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/PineauGT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal item, Robotics Auton. Syst. 54(11), 2006 (two pages).
@article{DBLP:journals/ras/VlassisGP06,
  author    = {Nikos Vlassis and Geoffrey J. Gordon and Joelle Pineau},
  title     = {Planning under uncertainty in robotics},
  journal   = {Robotics Auton. Syst.},
  volume    = {54},
  number    = {11},
  pages     = {885--886},
  year      = {2006},
  url       = {https://doi.org/10.1016/j.robot.2006.06.001},
  doi       = {10.1016/J.ROBOT.2006.06.001},
  timestamp = {Tue, 12 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ras/VlassisGP06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2006 conference paper (Hundt, Panangaden, Pineau, Precup).
@inproceedings{DBLP:conf/aaai/HundtPPP06,
  author    = {Christopher Hundt and Prakash Panangaden and Joelle Pineau and Doina Precup},
  title     = {Representing Systems with Hidden State},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {368--374},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-059.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/HundtPPP06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICAPS 2006 conference paper (Burfoot, Pineau, Dudek).
% RRT-Plan is braced as a whole word so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/aips/BurfootPD06,
  author    = {Daniel Burfoot and Joelle Pineau and Gregory Dudek},
  editor    = {Derek Long and Stephen F. Smith and Daniel Borrajo and Lee McCluskey},
  title     = {{RRT-Plan}: {A} Randomized Algorithm for {STRIPS} Planning},
  booktitle = {Proceedings of the Sixteenth International Conference on Automated Planning and Scheduling, {ICAPS} 2006, Cumbria, UK, June 6-10, 2006},
  pages     = {362--365},
  publisher = {{AAAI}},
  year      = {2006},
  url       = {http://www.aaai.org/Library/ICAPS/2006/icaps06-041.php},
  timestamp = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aips/BurfootPD06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ECML 2006 paper, published as LNCS volume 4212.
% The acronym PAC and the proper noun Markov are braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/ecml/GavaldaKPP06,
  author    = {Ricard Gavald{\`{a}} and Philipp W. Keller and Joelle Pineau and Doina Precup},
  editor    = {Johannes F{\"{u}}rnkranz and Tobias Scheffer and Myra Spiliopoulou},
  title     = {{PAC}-Learning of {Markov} Models with Hidden State},
  booktitle = {Machine Learning: {ECML} 2006, 17th European Conference on Machine Learning, Berlin, Germany, September 18-22, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4212},
  pages     = {150--161},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11871842\_18},
  doi       = {10.1007/11871842\_18},
  timestamp = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ecml/GavaldaKPP06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ECML 2005 paper, published as LNCS volume 3720.
% The proper noun Markov is braced so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/ecml/JaulmesPP05,
  author    = {Robin Jaulmes and Joelle Pineau and Doina Precup},
  editor    = {Jo{\~{a}}o Gama and Rui Camacho and Pavel Brazdil and Al{\'{\i}}pio Jorge and Lu{\'{\i}}s Torgo},
  title     = {Active Learning in Partially Observable {Markov} Decision Processes},
  booktitle = {Machine Learning: {ECML} 2005, 16th European Conference on Machine Learning, Porto, Portugal, October 3-7, 2005, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {3720},
  pages     = {601--608},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11564096\_59},
  doi       = {10.1007/11564096\_59},
  timestamp = {Wed, 24 Mar 2021 17:12:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ecml/JaulmesPP05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ISRR 2005 paper, published in Springer Tracts in Advanced Robotics volume 28.
@inproceedings{DBLP:conf/isrr/PineauG05,
  author    = {Joelle Pineau and Geoffrey J. Gordon},
  editor    = {Sebastian Thrun and Rodney A. Brooks and Hugh F. Durrant{-}Whyte},
  title     = {{POMDP} Planning for Robust Robot Control},
  booktitle = {Robotics Research: Results of the 12th International Symposium, {ISRR} 2005, October 12-15, 2005, San Francisco, CA, {USA}},
  series    = {Springer Tracts in Advanced Robotics},
  volume    = {28},
  pages     = {69--82},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/978-3-540-48113-3\_7},
  doi       = {10.1007/978-3-540-48113-3\_7},
  timestamp = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/isrr/PineauG05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Robotics Auton. Syst. 42(3-4), 2003.
@article{DBLP:journals/ras/PineauMPRT03,
  author    = {Joelle Pineau and Michael Montemerlo and Martha E. Pollack and Nicholas Roy and Sebastian Thrun},
  title     = {Towards robotic assistants in nursing homes: Challenges and results},
  journal   = {Robotics Auton. Syst.},
  volume    = {42},
  number    = {3-4},
  pages     = {271--281},
  year      = {2003},
  url       = {https://doi.org/10.1016/S0921-8890(02)00381-0},
  doi       = {10.1016/S0921-8890(02)00381-0},
  timestamp = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ras/PineauMPRT03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2003 conference paper (Pineau, Gordon, Thrun).
% The acronym POMDPs is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/ijcai/PineauGT03,
  author    = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  editor    = {Georg Gottlob and Toby Walsh},
  title     = {Point-based value iteration: An anytime algorithm for {POMDPs}},
  booktitle = {IJCAI-03, Proceedings of the Eighteenth International Joint Conference on Artificial Intelligence, Acapulco, Mexico, August 9-15, 2003},
  pages     = {1025--1032},
  publisher = {Morgan Kaufmann},
  year      = {2003},
  url       = {http://ijcai.org/Proceedings/03/Papers/147.pdf},
  timestamp = {Tue, 20 Aug 2019 16:18:41 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/PineauGT03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2003 conference paper (Pineau, Gordon, Thrun).
% The acronym POMDPs is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/PineauGT03,
  author    = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  editor    = {Sebastian Thrun and Lawrence K. Saul and Bernhard Sch{\"{o}}lkopf},
  title     = {Applying Metric-Trees to Belief-Point {POMDPs}},
  booktitle = {Advances in Neural Information Processing Systems 16 [Neural Information Processing Systems, {NIPS} 2003, December 8-13, 2003, Vancouver and Whistler, British Columbia, Canada]},
  pages     = {759--766},
  publisher = {{MIT} Press},
  year      = {2003},
  url       = {https://proceedings.neurips.cc/paper/2003/hash/6547884cea64550284728eb26b0947ef-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/PineauGT03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2003 conference paper (Pineau, Gordon, Thrun).
% Query-string ampersands in url are written as plain LaTeX-escaped \& (no HTML entity text);
% the conference date in booktitle has a comma before the year.
@inproceedings{DBLP:conf/uai/PineauGT03,
  author    = {Joelle Pineau and Geoffrey J. Gordon and Sebastian Thrun},
  editor    = {Christopher Meek and Uffe Kj{\ae}rulff},
  title     = {Policy-contingent abstraction for robust robot control},
  booktitle = {{UAI} '03, Proceedings of the 19th Conference in Uncertainty in Artificial Intelligence, Acapulco, Mexico, August 7-10, 2003},
  pages     = {477--484},
  publisher = {Morgan Kaufmann},
  year      = {2003},
  url       = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=964\&proceeding\_id=19},
  timestamp = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/uai/PineauGT03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI/IAAI 2002 conference paper (Montemerlo, Pineau, Roy, Thrun, Verma).
@inproceedings{DBLP:conf/aaai/MontemerloPRTV02,
  author    = {Michael Montemerlo and Joelle Pineau and Nicholas Roy and Sebastian Thrun and Vandi Verma},
  editor    = {Rina Dechter and Michael J. Kearns and Richard S. Sutton},
  title     = {Experiences with a Mobile Robotic Guide for the Elderly},
  booktitle = {Proceedings of the Eighteenth National Conference on Artificial Intelligence and Fourteenth Conference on Innovative Applications of Artificial Intelligence, July 28 - August 1, 2002, Edmonton, Alberta, Canada},
  pages     = {587--592},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2002},
  url       = {http://www.aaai.org/Library/AAAI/2002/aaai02-088.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/MontemerloPRTV02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AMIA 2002 Annual Symposium paper; the record carries no pages field.
@inproceedings{DBLP:conf/amia/MatthewsEMPRRT02,
  author    = {Judith T. Matthews and Sandra Engberg and Michael Montemerlo and Joelle Pineau and Nicholas Roy and Joan Rogers and Sebastian Thrun},
  title     = {Robotic Assistance During Ambulation by Older Adults},
  booktitle = {{AMIA} 2002, American Medical Informatics Association Annual Symposium, San Antonio, TX, USA, November 9-13, 2002},
  publisher = {{AMIA}},
  year      = {2002},
  url       = {https://knowledge.amia.org/amia-55142-a2002a-1.610020/t-002-1.611916/f-001-1.611917/a-333-1.612245/a-334-1.612242},
  timestamp = {Wed, 17 Apr 2024 11:48:33 +0200},
  biburl    = {https://dblp.org/rec/conf/amia/MatthewsEMPRRT02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2000 conference paper (Roy, Pineau, Thrun); url points at the ACL Anthology record.
@inproceedings{DBLP:conf/acl/RoyPT00,
  author    = {Nicholas Roy and Joelle Pineau and Sebastian Thrun},
  title     = {Spoken Dialogue Management Using Probabilistic Reasoning},
  booktitle = {38th Annual Meeting of the Association for Computational Linguistics, Hong Kong, China, October 1-8, 2000},
  pages     = {93--100},
  publisher = {{ACL}},
  year      = {2000},
  url       = {https://aclanthology.org/P00-1013/},
  doi       = {10.3115/1075218.1075231},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/RoyPT00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2000 conference paper (Goddeau, Pineau).
@inproceedings{DBLP:conf/icassp/GoddeauP00,
  author    = {David Goddeau and Joelle Pineau},
  title     = {Fast reinforcement learning of dialog strategies},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing. {ICASSP} 2000, 5-9 June, 2000, Hilton Hotel and Convention Center, Istanbul, Turkey},
  pages     = {1233--1236},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICASSP.2000.859189},
  doi       = {10.1109/ICASSP.2000.859189},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/GoddeauP00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.