% BibTeX records: Dzmitry Bahdanau
%
% Downloaded as a .bib file from the dblp computer science bibliography (https://dblp.org).

% EMNLP 2023 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2310-11634). The coined name in the title is braced so
% that sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/emnlp/PatelBRB23,
  author       = {Arkil Patel and
                  Satwik Bhattamishra and
                  Siva Reddy and
                  Dzmitry Bahdanau},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {{MAGNIFICo}: Evaluating the In-Context Learning Ability of Large Language
                  Models to Generalize to Novel Interpretations},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {2167--2189},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.134},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.134},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/PatelBRB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2023 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2310-14192). The coined name in the title is braced so
% that sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/emnlp/SahuVBL23,
  author       = {Gaurav Sahu and
                  Olga Vechtomova and
                  Dzmitry Bahdanau and
                  Issam H. Laradji},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {{PromptMix}: {A} Class Boundary Augmentation Method for Large Language
                  Model Distillation},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {5316--5327},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.323},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.323},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SahuVBL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2301.03988 (CoRR, 2023). The coined name in the title is braced
% so that sentence-casing bibliography styles do not lowercase it.
% NOTE(review): authors are in "First Last" form, so BibTeX treats only the final
% capitalised word as the surname (e.g. "Allal", "Ferrandis", "Toni"). Confirm
% whether any of these are multi-word surnames and, if so, switch those names to
% the unambiguous "Last, First" form.
@article{DBLP:journals/corr/abs-2301-03988,
  author       = {Loubna Ben Allal and
                  Raymond Li and
                  Denis Kocetkov and
                  Chenghao Mou and
                  Christopher Akiki and
                  Carlos Mu{\~{n}}oz Ferrandis and
                  Niklas Muennighoff and
                  Mayank Mishra and
                  Alex Gu and
                  Manan Dey and
                  Logesh Kumar Umapathi and
                  Carolyn Jane Anderson and
                  Yangtian Zi and
                  Joel Lamy{-}Poirier and
                  Hailey Schoelkopf and
                  Sergey Troshin and
                  Dmitry Abulkhanov and
                  Manuel Romero and
                  Michael Lappert and
                  Francesco De Toni and
                  Bernardo Garc{\'{\i}}a del R{\'{\i}}o and
                  Qian Liu and
                  Shamik Bose and
                  Urvashi Bhattacharyya and
                  Terry Yue Zhuo and
                  Ian Yu and
                  Paulo Villegas and
                  Marco Zocca and
                  Sourab Mangrulkar and
                  David Lansky and
                  Huu Nguyen and
                  Danish Contractor and
                  Luis Villa and
                  Jia Li and
                  Dzmitry Bahdanau and
                  Yacine Jernite and
                  Sean Hughes and
                  Daniel Fried and
                  Arjun Guha and
                  Harm de Vries and
                  Leandro von Werra},
  title        = {{SantaCoder}: don't reach for the stars!},
  journal      = {CoRR},
  volume       = {abs/2301.03988},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.03988},
  doi          = {10.48550/ARXIV.2301.03988},
  eprinttype   = {arXiv},
  eprint       = {2301.03988},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-03988.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.06161 (CoRR, 2023). The coined name in the title is braced
% so that sentence-casing bibliography styles do not lowercase it.
% NOTE(review): authors are in "First Last" form, so BibTeX treats only the final
% capitalised word as the surname (e.g. "Allal", "Ferrandis", "V"). Confirm
% whether any of these are multi-word surnames or trailing initials and, if so,
% switch those names to the unambiguous "Last, First" form.
@article{DBLP:journals/corr/abs-2305-06161,
  author       = {Raymond Li and
                  Loubna Ben Allal and
                  Yangtian Zi and
                  Niklas Muennighoff and
                  Denis Kocetkov and
                  Chenghao Mou and
                  Marc Marone and
                  Christopher Akiki and
                  Jia Li and
                  Jenny Chim and
                  Qian Liu and
                  Evgenii Zheltonozhskii and
                  Terry Yue Zhuo and
                  Thomas Wang and
                  Olivier Dehaene and
                  Mishig Davaadorj and
                  Joel Lamy{-}Poirier and
                  Jo{\~{a}}o Monteiro and
                  Oleh Shliazhko and
                  Nicolas Gontier and
                  Nicholas Meade and
                  Armel Zebaze and
                  Ming{-}Ho Yee and
                  Logesh Kumar Umapathi and
                  Jian Zhu and
                  Benjamin Lipkin and
                  Muhtasham Oblokulov and
                  Zhiruo Wang and
                  Rudra Murthy V and
                  Jason Stillerman and
                  Siva Sankalp Patel and
                  Dmitry Abulkhanov and
                  Marco Zocca and
                  Manan Dey and
                  Zhihan Zhang and
                  Nour Moustafa{-}Fahmy and
                  Urvashi Bhattacharyya and
                  Wenhao Yu and
                  Swayam Singh and
                  Sasha Luccioni and
                  Paulo Villegas and
                  Maxim Kunakov and
                  Fedor Zhdanov and
                  Manuel Romero and
                  Tony Lee and
                  Nadav Timor and
                  Jennifer Ding and
                  Claire Schlesinger and
                  Hailey Schoelkopf and
                  Jan Ebert and
                  Tri Dao and
                  Mayank Mishra and
                  Alex Gu and
                  Jennifer Robinson and
                  Carolyn Jane Anderson and
                  Brendan Dolan{-}Gavitt and
                  Danish Contractor and
                  Siva Reddy and
                  Daniel Fried and
                  Dzmitry Bahdanau and
                  Yacine Jernite and
                  Carlos Mu{\~{n}}oz Ferrandis and
                  Sean Hughes and
                  Thomas Wolf and
                  Arjun Guha and
                  Leandro von Werra and
                  Harm de Vries},
  title        = {{StarCoder}: may the source be with you!},
  journal      = {CoRR},
  volume       = {abs/2305.06161},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.06161},
  doi          = {10.48550/ARXIV.2305.06161},
  eprinttype   = {arXiv},
  eprint       = {2305.06161},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-06161.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.10998 (CoRR, 2023). The coined name in the title is braced
% so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2306-10998,
  author       = {Disha Shrivastava and
                  Denis Kocetkov and
                  Harm de Vries and
                  Dzmitry Bahdanau and
                  Torsten Scholak},
  title        = {{RepoFusion}: Training Code Models to Understand Your Repository},
  journal      = {CoRR},
  volume       = {abs/2306.10998},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.10998},
  doi          = {10.48550/ARXIV.2306.10998},
  eprinttype   = {arXiv},
  eprint       = {2306.10998},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-10998.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.10954 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2309-10954,
  author       = {Aristides Milios and
                  Siva Reddy and
                  Dzmitry Bahdanau},
  title        = {In-Context Learning for Text Classification with Many Labels},
  journal      = {CoRR},
  volume       = {abs/2309.10954},
  year         = {2023},
  eprinttype   = {arXiv},
  eprint       = {2309.10954},
  doi          = {10.48550/ARXIV.2309.10954},
  url          = {https://doi.org/10.48550/arXiv.2309.10954},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-10954.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.11634 (CoRR, 2023); same title and authors as the EMNLP
% record DBLP:conf/emnlp/PatelBRB23. The coined name in the title is braced so
% that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2310-11634,
  author       = {Arkil Patel and
                  Satwik Bhattamishra and
                  Siva Reddy and
                  Dzmitry Bahdanau},
  title        = {{MAGNIFICo}: Evaluating the In-Context Learning Ability of Large Language
                  Models to Generalize to Novel Interpretations},
  journal      = {CoRR},
  volume       = {abs/2310.11634},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.11634},
  doi          = {10.48550/ARXIV.2310.11634},
  eprinttype   = {arXiv},
  eprint       = {2310.11634},
  timestamp    = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-11634.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.14192 (CoRR, 2023); same title and authors as the EMNLP
% record DBLP:conf/emnlp/SahuVBL23. The coined name in the title is braced so
% that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2310-14192,
  author       = {Gaurav Sahu and
                  Olga Vechtomova and
                  Dzmitry Bahdanau and
                  Issam H. Laradji},
  title        = {{PromptMix}: {A} Class Boundary Augmentation Method for Large Language
                  Model Distillation},
  journal      = {CoRR},
  volume       = {abs/2310.14192},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.14192},
  doi          = {10.48550/ARXIV.2310.14192},
  eprinttype   = {arXiv},
  eprint       = {2310.14192},
  timestamp    = {Mon, 30 Oct 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-14192.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2311.09635 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2311-09635,
  author       = {Arkil Patel and
                  Siva Reddy and
                  Dzmitry Bahdanau and
                  Pradeep Dasigi},
  title        = {Evaluating In-Context Learning of Libraries for Code Generation},
  journal      = {CoRR},
  volume       = {abs/2311.09635},
  year         = {2023},
  eprinttype   = {arXiv},
  eprint       = {2311.09635},
  doi          = {10.48550/ARXIV.2311.09635},
  url          = {https://doi.org/10.48550/arXiv.2311.09635},
  timestamp    = {Tue, 21 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-09635.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2022 long paper. The mixed-case name in the title is braced so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/acl/JamborB22,
  author       = {Dora Jambor and
                  Dzmitry Bahdanau},
  editor       = {Smaranda Muresan and
                  Preslav Nakov and
                  Aline Villavicencio},
  title        = {{LAGr}: Label Aligned Graphs for Better Systematic Generalization in
                  Semantic Parsing},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {3295--3308},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.233},
  doi          = {10.18653/V1/2022.ACL-LONG.233},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/JamborB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2022 long paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2110-06843).
@inproceedings{DBLP:conf/acl/GoodwinROB22,
  author       = {Emily Goodwin and
                  Siva Reddy and
                  Timothy J. O'Donnell and
                  Dzmitry Bahdanau},
  title        = {Compositional Generalization in Dependency Parsing},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  editor       = {Smaranda Muresan and
                  Preslav Nakov and
                  Aline Villavicencio},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  pages        = {6482--6493},
  doi          = {10.18653/V1/2022.ACL-LONG.448},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.448},
  timestamp    = {Sat, 28 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/GoodwinROB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Paper at the 4th Workshop on NLP for Conversational AI, 2022 (same title and
% authors as the CoRR record DBLP:journals/corr/abs-2204-01959).
@inproceedings{DBLP:conf/acl-convai/SahuRLAVB22,
  author       = {Gaurav Sahu and
                  Pau Rodr{\'{\i}}guez and
                  Issam H. Laradji and
                  Parmida Atighehchian and
                  David V{\'{a}}zquez and
                  Dzmitry Bahdanau},
  title        = {Data Augmentation for Intent Classification with Off-the-shelf Large
                  Language Models},
  booktitle    = {Proceedings of the 4th Workshop on {NLP} for Conversational AI, ConvAI@ACL
                  2022, Dublin, Ireland, May 27, 2022},
  editor       = {Bing Liu and
                  Alexandros Papangelis and
                  Stefan Ultes and
                  Abhinav Rastogi and
                  Yun{-}Nung Chen and
                  Georgios Spithourakis and
                  Elnaz Nouri and
                  Weiyan Shi},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  pages        = {47--57},
  doi          = {10.18653/V1/2022.NLP4CONVAI-1.5},
  url          = {https://doi.org/10.18653/v1/2022.nlp4convai-1.5},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl-convai/SahuRLAVB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Paper at the Fifth BlackboxNLP Workshop, 2022 (same title and authors as the
% CoRR record DBLP:journals/corr/abs-2211-08473).
@inproceedings{DBLP:conf/blackboxnlp/HosseiniVBSC22,
  author       = {Arian Hosseini and
                  Ankit Vani and
                  Dzmitry Bahdanau and
                  Alessandro Sordoni and
                  Aaron C. Courville},
  title        = {On the Compositional Generalization Gap of In-Context Learning},
  booktitle    = {Proceedings of the Fifth BlackboxNLP Workshop on Analyzing and Interpreting
                  Neural Networks for NLP, BlackboxNLP@EMNLP 2022, Abu Dhabi, United
                  Arab Emirates (Hybrid), December 8, 2022},
  editor       = {Jasmijn Bastings and
                  Yonatan Belinkov and
                  Yanai Elazar and
                  Dieuwke Hupkes and
                  Naomi Saphra and
                  Sarah Wiegreffe},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  pages        = {272--280},
  doi          = {10.18653/V1/2022.BLACKBOXNLP-1.22},
  url          = {https://doi.org/10.18653/v1/2022.blackboxnlp-1.22},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/blackboxnlp/HosseiniVBSC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.00498 (CoRR, 2022). The compound containing the acronym
% SQL is braced so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2204-00498,
  author       = {Nitarshan Rajkumar and
                  Raymond Li and
                  Dzmitry Bahdanau},
  title        = {Evaluating the {Text-to-SQL} Capabilities of Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2204.00498},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.00498},
  doi          = {10.48550/ARXIV.2204.00498},
  eprinttype   = {arXiv},
  eprint       = {2204.00498},
  timestamp    = {Wed, 06 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-00498.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.01959 (CoRR, 2022); same title and authors as the workshop
% record DBLP:conf/acl-convai/SahuRLAVB22.
@article{DBLP:journals/corr/abs-2204-01959,
  author       = {Gaurav Sahu and
                  Pau Rodr{\'{\i}}guez and
                  Issam H. Laradji and
                  Parmida Atighehchian and
                  David V{\'{a}}zquez and
                  Dzmitry Bahdanau},
  title        = {Data Augmentation for Intent Classification with Off-the-shelf Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2204.01959},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2204.01959},
  doi          = {10.48550/ARXIV.2204.01959},
  url          = {https://doi.org/10.48550/arXiv.2204.01959},
  timestamp    = {Wed, 06 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-01959.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.08473 (CoRR, 2022); same title and authors as the workshop
% record DBLP:conf/blackboxnlp/HosseiniVBSC22.
@article{DBLP:journals/corr/abs-2211-08473,
  author       = {Arian Hosseini and
                  Ankit Vani and
                  Dzmitry Bahdanau and
                  Alessandro Sordoni and
                  Aaron C. Courville},
  title        = {On the Compositional Generalization Gap of In-Context Learning},
  journal      = {CoRR},
  volume       = {abs/2211.08473},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2211.08473},
  doi          = {10.48550/ARXIV.2211.08473},
  url          = {https://doi.org/10.48550/arXiv.2211.08473},
  timestamp    = {Wed, 23 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-08473.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.15533 (CoRR, 2022). "Stack" is braced on the assumption
% that "The Stack" is a proper name that must keep its capital under
% sentence-casing bibliography styles.
% NOTE(review): authors are in "First Last" form, so BibTeX treats only the final
% capitalised word as the surname (e.g. "Allal", "Ferrandis"). Confirm whether
% any of these are multi-word surnames and, if so, switch those names to the
% unambiguous "Last, First" form.
@article{DBLP:journals/corr/abs-2211-15533,
  author       = {Denis Kocetkov and
                  Raymond Li and
                  Loubna Ben Allal and
                  Jia Li and
                  Chenghao Mou and
                  Carlos Mu{\~{n}}oz Ferrandis and
                  Yacine Jernite and
                  Margaret Mitchell and
                  Sean Hughes and
                  Thomas Wolf and
                  Dzmitry Bahdanau and
                  Leandro von Werra and
                  Harm de Vries},
  title        = {The {Stack}: 3 {TB} of permissively licensed source code},
  journal      = {CoRR},
  volume       = {abs/2211.15533},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.15533},
  doi          = {10.48550/ARXIV.2211.15533},
  eprinttype   = {arXiv},
  eprint       = {2211.15533},
  timestamp    = {Tue, 29 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-15533.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2021 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2109-05093). The colon sits outside the protective
% braces so that sentence-casing styles see it and keep the capital on the
% word that follows; only the acronym itself is braced.
@inproceedings{DBLP:conf/emnlp/ScholakSB21,
  author       = {Torsten Scholak and
                  Nathan Schucher and
                  Dzmitry Bahdanau},
  editor       = {Marie{-}Francine Moens and
                  Xuanjing Huang and
                  Lucia Specia and
                  Scott Wen{-}tau Yih},
  title        = {{PICARD}: Parsing Incrementally for Constrained Auto-Regressive Decoding
                  from Language Models},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {9895--9901},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.779},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.779},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ScholakSB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCNN 2021 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2002-00412).
@inproceedings{DBLP:conf/ijcnn/ZolnaSBHCBB21,
  author       = {Konrad Zolna and
                  Chitwan Saharia and
                  L{\'{e}}onard Boussioux and
                  David Yu{-}Tung Hui and
                  Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {Combating False Negatives in Adversarial Imitation Learning},
  booktitle    = {International Joint Conference on Neural Networks, {IJCNN} 2021, Shenzhen,
                  China, July 18-22, 2021},
  publisher    = {{IEEE}},
  year         = {2021},
  pages        = {1--9},
  doi          = {10.1109/IJCNN52387.2021.9534032},
  url          = {https://doi.org/10.1109/IJCNN52387.2021.9534032},
  timestamp    = {Wed, 29 Sep 2021 17:00:55 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/ZolnaSBHCBB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NAACL-HLT 2021 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2105-03519).
@inproceedings{DBLP:conf/naacl/HosseiniRBHSC21,
  author       = {Arian Hosseini and
                  Siva Reddy and
                  Dzmitry Bahdanau and
                  R. Devon Hjelm and
                  Alessandro Sordoni and
                  Aaron C. Courville},
  title        = {Understanding by Understanding Not: Modeling Negation in Language
                  Models},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  editor       = {Kristina Toutanova and
                  Anna Rumshisky and
                  Luke Zettlemoyer and
                  Dilek Hakkani{-}T{\"{u}}r and
                  Iz Beltagy and
                  Steven Bethard and
                  Ryan Cotterell and
                  Tanmoy Chakraborty and
                  Yichao Zhou},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  pages        = {1301--1312},
  doi          = {10.18653/V1/2021.NAACL-MAIN.102},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.102},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/HosseiniRBHSC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NAACL-HLT 2021 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2010-11119). The mixed-case model name and the compound
% containing the acronym SQL are braced so that sentence-casing bibliography
% styles do not lowercase them.
@inproceedings{DBLP:conf/naacl/ScholakLBVP21,
  author       = {Torsten Scholak and
                  Raymond Li and
                  Dzmitry Bahdanau and
                  Harm de Vries and
                  Chris Pal},
  editor       = {Kristina Toutanova and
                  Anna Rumshisky and
                  Luke Zettlemoyer and
                  Dilek Hakkani{-}T{\"{u}}r and
                  Iz Beltagy and
                  Steven Bethard and
                  Ryan Cotterell and
                  Tanmoy Chakraborty and
                  Yichao Zhou},
  title        = {{DuoRAT}: Towards Simpler {Text-to-SQL} Models},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  pages        = {1313--1321},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.103},
  doi          = {10.18653/V1/2021.NAACL-MAIN.103},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/ScholakLBVP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 conference paper (same title and authors as the CoRR record
% DBLP:journals/corr/abs-2112-00578). The record carries no publisher or doi field.
@inproceedings{DBLP:conf/nips/BergenOB21,
  author       = {Leon Bergen and
                  Timothy J. O'Donnell and
                  Dzmitry Bahdanau},
  title        = {Systematic Generalization with Edge Transformers},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  year         = {2021},
  pages        = {1390--1402},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/0a4dc6dae338c9cb08947c07581f77a2-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BergenOB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.06645 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2104-06645,
  author       = {Leon Bergen and
                  Dzmitry Bahdanau and
                  Timothy J. O'Donnell},
  title        = {Jointly Learning Truth-Conditional Denotations and Groundings using
                  Parallel Attention},
  journal      = {CoRR},
  volume       = {abs/2104.06645},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2104.06645},
  url          = {https://arxiv.org/abs/2104.06645},
  timestamp    = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-06645.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2105.03519 (CoRR, 2021); same title and authors as the NAACL
% record DBLP:conf/naacl/HosseiniRBHSC21.
@article{DBLP:journals/corr/abs-2105-03519,
  author       = {Arian Hosseini and
                  Siva Reddy and
                  Dzmitry Bahdanau and
                  R. Devon Hjelm and
                  Alessandro Sordoni and
                  Aaron C. Courville},
  title        = {Understanding by Understanding Not: Modeling Negation in Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2105.03519},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2105.03519},
  url          = {https://arxiv.org/abs/2105.03519},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-03519.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.05093 (CoRR, 2021); same title and authors as the EMNLP
% record DBLP:conf/emnlp/ScholakSB21. The colon sits outside the protective
% braces so that sentence-casing styles see it and keep the capital on the
% word that follows; only the acronym itself is braced.
@article{DBLP:journals/corr/abs-2109-05093,
  author       = {Torsten Scholak and
                  Nathan Schucher and
                  Dzmitry Bahdanau},
  title        = {{PICARD}: Parsing Incrementally for Constrained Auto-Regressive Decoding
                  from Language Models},
  journal      = {CoRR},
  volume       = {abs/2109.05093},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.05093},
  eprinttype   = {arXiv},
  eprint       = {2109.05093},
  timestamp    = {Tue, 21 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-05093.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.06843 (CoRR, 2021); same title and authors as the ACL
% record DBLP:conf/acl/GoodwinROB22.
@article{DBLP:journals/corr/abs-2110-06843,
  author       = {Emily Goodwin and
                  Siva Reddy and
                  Timothy J. O'Donnell and
                  Dzmitry Bahdanau},
  title        = {Compositional Generalization in Dependency Parsing},
  journal      = {CoRR},
  volume       = {abs/2110.06843},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.06843},
  url          = {https://arxiv.org/abs/2110.06843},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-06843.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.07572 (CoRR, 2021). The mixed-case name in the title is
% braced so that sentence-casing bibliography styles do not lowercase it.
% The title wording differs from the ACL record DBLP:conf/acl/JamborB22 by the
% same authors; both are kept as exported.
@article{DBLP:journals/corr/abs-2110-07572,
  author       = {Dora Jambor and
                  Dzmitry Bahdanau},
  title        = {{LAGr}: Labeling Aligned Graphs for Improving Systematic Generalization
                  in Semantic Parsing},
  journal      = {CoRR},
  volume       = {abs/2110.07572},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.07572},
  eprinttype   = {arXiv},
  eprint       = {2110.07572},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-07572.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2112.00578 (CoRR, 2021); same title and authors as the NeurIPS
% record DBLP:conf/nips/BergenOB21.
@article{DBLP:journals/corr/abs-2112-00578,
  author       = {Leon Bergen and
                  Timothy J. O'Donnell and
                  Dzmitry Bahdanau},
  title        = {Systematic Generalization with Edge Transformers},
  journal      = {CoRR},
  volume       = {abs/2112.00578},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2112.00578},
  url          = {https://arxiv.org/abs/2112.00578},
  timestamp    = {Tue, 07 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-00578.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2020 student abstract (pages 13999--14000).
@inproceedings{DBLP:conf/aaai/ZolnaSBHCBB20,
  author       = {Konrad Zolna and
                  Chitwan Saharia and
                  L{\'{e}}onard Boussioux and
                  David Yu{-}Tung Hui and
                  Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {Combating False Negatives in Adversarial Imitation Learning (Student
                  Abstract)},
  booktitle    = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2020, The Thirty-Second Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
                  February 7-12, 2020},
  publisher    = {{AAAI} Press},
  year         = {2020},
  pages        = {13999--14000},
  doi          = {10.1609/AAAI.V34I10.7272},
  url          = {https://doi.org/10.1609/aaai.v34i10.7272},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZolnaSBHCBB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.00412 (CoRR, 2020); same title and authors as the IJCNN
% record DBLP:conf/ijcnn/ZolnaSBHCBB21.
@article{DBLP:journals/corr/abs-2002-00412,
  author       = {Konrad Zolna and
                  Chitwan Saharia and
                  L{\'{e}}onard Boussioux and
                  David Yu{-}Tung Hui and
                  Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {Combating False Negatives in Adversarial Imitation Learning},
  journal      = {CoRR},
  volume       = {abs/2002.00412},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.00412},
  url          = {https://arxiv.org/abs/2002.00412},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-00412.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.12770 (CoRR, 2020). The mixed-case name in the title is
% braced so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2007-12770,
  author       = {David Yu{-}Tung Hui and
                  Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {{BabyAI} 1.1},
  journal      = {CoRR},
  volume       = {abs/2007.12770},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.12770},
  eprinttype   = {arXiv},
  eprint       = {2007.12770},
  timestamp    = {Wed, 29 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-12770.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.14435 (CoRR, 2020).
@article{DBLP:journals/corr/abs-2007-14435,
  author       = {Harm de Vries and
                  Dzmitry Bahdanau and
                  Christopher D. Manning},
  title        = {Towards Ecologically Valid Research on Language User Interfaces},
  journal      = {CoRR},
  volume       = {abs/2007.14435},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2007.14435},
  url          = {https://arxiv.org/abs/2007.14435},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-14435.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-11119,
  author       = {Torsten Scholak and
                  Raymond Li and
                  Dzmitry Bahdanau and
                  Harm de Vries and
                  Chris Pal},
  title        = {{DuoRAT}: Towards Simpler Text-to-{SQL} Models},
  journal      = {CoRR},
  volume       = {abs/2010.11119},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.11119},
  eprinttype   = {arXiv},
  eprint       = {2010.11119},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-11119.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BahdanauHLHHKG19,
  author       = {Bahdanau, Dzmitry and
                  Hill, Felix and
                  Leike, Jan and
                  Hughes, Edward and
                  Hosseini, Seyed Arian and
                  Kohli, Pushmeet and
                  Grefenstette, Edward},
  title        = {Learning to Understand Goal Specifications by Modelling Reward},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=H1xsSjC9Ym},
  timestamp    = {Fri, 09 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauHLHHKG19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/BahdanauMNNVC19,
  author       = {Bahdanau, Dzmitry and
                  Murty, Shikhar and
                  Noukhovitch, Michael and
                  Nguyen, Thien Huu and
                  de Vries, Harm and
                  Courville, Aaron C.},
  title        = {Systematic Generalization: What Is Required and Can It Be Learned?},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=HkezXnA9YX},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauMNNVC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/Chevalier-Boisvert19,
  author       = {Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Salem Lahlou and
                  Lucas Willems and
                  Chitwan Saharia and
                  Thien Huu Nguyen and
                  Yoshua Bengio},
  title        = {{BabyAI}: {A} Platform to Study the Sample Efficiency of Grounded Language
                  Learning},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rJeXCo0cYX},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Chevalier-Boisvert19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/VriesBMCB19,
  author       = {Harm de Vries and
                  Dzmitry Bahdanau and
                  Shikhar Murty and
                  Aaron C. Courville and
                  Philippe Beaudoin},
  title        = {{CLOSURE:} Assessing Systematic Generalization of {CLEVR} Models},
  booktitle    = {Visually Grounded Interaction and Language ({ViGIL}), {NeurIPS} 2019 Workshop,
                  Vancouver, Canada, December 13, 2019},
  year         = {2019},
  url          = {https://vigilworkshop.github.io/static/papers/28.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/VriesBMCB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-00444,
  author       = {Anirudh Srinivasan and
                  Dzmitry Bahdanau and
                  Maxime Chevalier{-}Boisvert and
                  Yoshua Bengio},
  title        = {Automated curriculum generation for Policy Gradients from Demonstrations},
  journal      = {CoRR},
  volume       = {abs/1912.00444},
  year         = {2019},
  url          = {https://arxiv.org/abs/1912.00444},
  eprinttype   = {arXiv},
  eprint       = {1912.00444},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-00444.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-05783,
  author       = {Dzmitry Bahdanau and
                  Harm de Vries and
                  Timothy J. O'Donnell and
                  Shikhar Murty and
                  Philippe Beaudoin and
                  Yoshua Bengio and
                  Aaron C. Courville},
  title        = {{CLOSURE:} Assessing Systematic Generalization of {CLEVR} Models},
  journal      = {CoRR},
  volume       = {abs/1912.05783},
  year         = {2019},
  url          = {https://arxiv.org/abs/1912.05783},
  eprinttype   = {arXiv},
  eprint       = {1912.05783},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-05783.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BahdanauHLHKG18,
  author       = {Dzmitry Bahdanau and
                  Felix Hill and
                  Jan Leike and
                  Edward Hughes and
                  Pushmeet Kohli and
                  Edward Grefenstette},
  title        = {Jointly Learning ``What'' and ``How'' from Instructions
                  and Goal-States},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=BkmZvdkPM},
  timestamp    = {Fri, 09 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauHLHKG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-09259,
  author       = {Stanislaw Jastrzebski and
                  Dzmitry Bahdanau and
                  Seyedarian Hosseini and
                  Michael Noukhovitch and
                  Yoshua Bengio and
                  Jackie Chi Kit Cheung},
  title        = {Commonsense mining as knowledge base completion? {A} study on the
                  impact of novelty},
  journal      = {CoRR},
  volume       = {abs/1804.09259},
  year         = {2018},
  url          = {https://arxiv.org/abs/1804.09259},
  eprinttype   = {arXiv},
  eprint       = {1804.09259},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-09259.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-01946,
  author       = {Dzmitry Bahdanau and
                  Felix Hill and
                  Jan Leike and
                  Edward Hughes and
                  Pushmeet Kohli and
                  Edward Grefenstette},
  title        = {Learning to Follow Language Instructions with Adversarial Reward Induction},
  journal      = {CoRR},
  volume       = {abs/1806.01946},
  year         = {2018},
  url          = {https://arxiv.org/abs/1806.01946},
  eprinttype   = {arXiv},
  eprint       = {1806.01946},
  timestamp    = {Fri, 09 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-01946.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-08272,
  author       = {Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Salem Lahlou and
                  Lucas Willems and
                  Chitwan Saharia and
                  Thien Huu Nguyen and
                  Yoshua Bengio},
  title        = {{BabyAI}: First Steps Towards Grounded Language Learning With a Human
                  In the Loop},
  journal      = {CoRR},
  volume       = {abs/1810.08272},
  year         = {2018},
  url          = {https://arxiv.org/abs/1810.08272},
  eprinttype   = {arXiv},
  eprint       = {1810.08272},
  timestamp    = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-08272.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; shares title and author list with
% DBLP:conf/iclr/BahdanauMNNVC19 in this file (presumably the published
% version -- confirm before citing both).
@article{DBLP:journals/corr/abs-1811-12889,
  author       = {Dzmitry Bahdanau and
                  Shikhar Murty and
                  Michael Noukhovitch and
                  Thien Huu Nguyen and
                  Harm de Vries and
                  Aaron C. Courville},
  title        = {Systematic Generalization: What Is Required and Can It Be Learned?},
  journal      = {CoRR},
  volume       = {abs/1811.12889},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.12889},
  eprinttype   = {arXiv},
  eprint       = {1811.12889},
  timestamp    = {Mon, 03 Dec 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-12889.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BahdanauBXGLPCB17,
  author       = {Bahdanau, Dzmitry and
                  Brakel, Philemon and
                  Xu, Kelvin and
                  Goyal, Anirudh and
                  Lowe, Ryan and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SJDaqqveg},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauBXGLPCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/JaquesGBHTE17,
  author       = {Natasha Jaques and
                  Shixiang Gu and
                  Dzmitry Bahdanau and
                  Jos{\'{e}} Miguel Hern{\'{a}}ndez{-}Lobato and
                  Richard E. Turner and
                  Douglas Eck},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Sequence {Tutor}: Conservative Fine-Tuning of Sequence Generation Models
                  with {KL}-control},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {1645--1654},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {https://proceedings.mlr.press/v70/jaques17a.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/JaquesGBHTE17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BahdanauBJGVB17,
  author       = {Dzmitry Bahdanau and
                  Tom Bosc and
                  Stanislaw Jastrzebski and
                  Edward Grefenstette and
                  Pascal Vincent and
                  Yoshua Bengio},
  title        = {Learning to Compute Word Embeddings On the Fly},
  journal      = {CoRR},
  volume       = {abs/1706.00286},
  year         = {2017},
  url          = {https://arxiv.org/abs/1706.00286},
  eprinttype   = {arXiv},
  eprint       = {1706.00286},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauBJGVB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BahdanauCSBB16,
  author       = {Bahdanau, Dzmitry and
                  Chorowski, Jan and
                  Serdyuk, Dmitriy and
                  Brakel, Philemon and
                  Bengio, Yoshua},
  title        = {End-to-end attention-based large vocabulary speech recognition},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {4945--4949},
  publisher    = {{IEEE}},
  year         = {2016},
  doi          = {10.1109/ICASSP.2016.7472618},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472618},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BahdanauCSBB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/Al-RfouAAa16,
  author       = {Rami Al{-}Rfou and
                  Guillaume Alain and
                  Amjad Almahairi and
                  Christof Angerm{\"{u}}ller and
                  Dzmitry Bahdanau and
                  Nicolas Ballas and
                  Fr{\'{e}}d{\'{e}}ric Bastien and
                  Justin Bayer and
                  Anatoly Belikov and
                  Alexander Belopolsky and
                  Yoshua Bengio and
                  Arnaud Bergeron and
                  James Bergstra and
                  Valentin Bisson and
                  Josh Bleecher Snyder and
                  Nicolas Bouchard and
                  Nicolas Boulanger{-}Lewandowski and
                  Xavier Bouthillier and
                  Alexandre de Br{\'{e}}bisson and
                  Olivier Breuleux and
                  Pierre Luc Carrier and
                  Kyunghyun Cho and
                  Jan Chorowski and
                  Paul F. Christiano and
                  Tim Cooijmans and
                  Marc{-}Alexandre C{\^{o}}t{\'{e}} and
                  Myriam C{\^{o}}t{\'{e}} and
                  Aaron C. Courville and
                  Yann N. Dauphin and
                  Olivier Delalleau and
                  Julien Demouth and
                  Guillaume Desjardins and
                  Sander Dieleman and
                  Laurent Dinh and
                  Melanie Ducoffe and
                  Vincent Dumoulin and
                  Samira Ebrahimi Kahou and
                  Dumitru Erhan and
                  Ziye Fan and
                  Orhan Firat and
                  Mathieu Germain and
                  Xavier Glorot and
                  Ian J. Goodfellow and
                  Matthew Graham and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Philippe Hamel and
                  Iban Harlouchet and
                  Jean{-}Philippe Heng and
                  Bal{\'{a}}zs Hidasi and
                  Sina Honari and
                  Arjun Jain and
                  S{\'{e}}bastien Jean and
                  Kai Jia and
                  Mikhail Korobov and
                  Vivek Kulkarni and
                  Alex Lamb and
                  Pascal Lamblin and
                  Eric Larsen and
                  C{\'{e}}sar Laurent and
                  Sean Lee and
                  Simon Lefran{\c{c}}ois and
                  Simon Lemieux and
                  Nicholas L{\'{e}}onard and
                  Zhouhan Lin and
                  Jesse A. Livezey and
                  Cory Lorenz and
                  Jeremiah Lowin and
                  Qianli Ma and
                  Pierre{-}Antoine Manzagol and
                  Olivier Mastropietro and
                  Robert McGibbon and
                  Roland Memisevic and
                  Bart van Merri{\"{e}}nboer and
                  Vincent Michalski and
                  Mehdi Mirza and
                  Alberto Orlandi and
                  Christopher Joseph Pal and
                  Razvan Pascanu and
                  Mohammad Pezeshki and
                  Colin Raffel and
                  Daniel Renshaw and
                  Matthew Rocklin and
                  Adriana Romero and
                  Markus Roth and
                  Peter Sadowski and
                  John Salvatier and
                  Fran{\c{c}}ois Savard and
                  Jan Schl{\"{u}}ter and
                  John Schulman and
                  Gabriel Schwartz and
                  Iulian Vlad Serban and
                  Dmitriy Serdyuk and
                  Samira Shabanian and
                  {\'{E}}tienne Simon and
                  Sigurd Spieckermann and
                  S. Ramana Subramanyam and
                  Jakub Sygnowski and
                  J{\'{e}}r{\'{e}}mie Tanguay and
                  Gijs van Tulder and
                  Joseph P. Turian and
                  Sebastian Urban and
                  Pascal Vincent and
                  Francesco Visin and
                  Harm de Vries and
                  David Warde{-}Farley and
                  Dustin J. Webb and
                  Matthew Willson and
                  Kelvin Xu and
                  Lijun Xue and
                  Li Yao and
                  Saizheng Zhang and
                  Ying Zhang},
  title        = {Theano: {A} {Python} framework for fast computation of mathematical
                  expressions},
  journal      = {CoRR},
  volume       = {abs/1605.02688},
  year         = {2016},
  url          = {https://arxiv.org/abs/1605.02688},
  eprinttype   = {arXiv},
  eprint       = {1605.02688},
  timestamp    = {Thu, 30 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Al-RfouAAa16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; shares title and author list with
% DBLP:conf/iclr/BahdanauBXGLPCB17 in this file (presumably the published
% version -- confirm before citing both).
@article{DBLP:journals/corr/BahdanauBXGLPCB16,
  author       = {Dzmitry Bahdanau and
                  Philemon Brakel and
                  Kelvin Xu and
                  Anirudh Goyal and
                  Ryan Lowe and
                  Joelle Pineau and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  journal      = {CoRR},
  volume       = {abs/1607.07086},
  year         = {2016},
  url          = {https://arxiv.org/abs/1607.07086},
  eprinttype   = {arXiv},
  eprint       = {1607.07086},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauBXGLPCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChorowskiBSCB15,
  author       = {Chorowski, Jan and
                  Bahdanau, Dzmitry and
                  Serdyuk, Dmitriy and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Attention-Based Models for Speech Recognition},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {577--585},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/1068c6e4c8051cfd4e9ea8072e3189e2-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ChorowskiBSCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:journals/corr/BahdanauCB14,
  author       = {Dzmitry Bahdanau and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Neural Machine Translation by Jointly Learning to Align and Translate},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {https://arxiv.org/abs/1409.0473},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MerrienboerBDSW15,
  author       = {Bart van Merri{\"{e}}nboer and
                  Dzmitry Bahdanau and
                  Vincent Dumoulin and
                  Dmitriy Serdyuk and
                  David Warde{-}Farley and
                  Jan Chorowski and
                  Yoshua Bengio},
  title        = {{Blocks} and {Fuel}: Frameworks for deep learning},
  journal      = {CoRR},
  volume       = {abs/1506.00619},
  year         = {2015},
  url          = {https://arxiv.org/abs/1506.00619},
  eprinttype   = {arXiv},
  eprint       = {1506.00619},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MerrienboerBDSW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; shares title and authors with
% DBLP:conf/nips/ChorowskiBSCB15 in this file (presumably the published
% version -- confirm before citing both).
@article{DBLP:journals/corr/ChorowskiBSCB15,
  author       = {Jan Chorowski and
                  Dzmitry Bahdanau and
                  Dmitriy Serdyuk and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Attention-Based Models for Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1506.07503},
  year         = {2015},
  url          = {https://arxiv.org/abs/1506.07503},
  eprinttype   = {arXiv},
  eprint       = {1506.07503},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChorowskiBSCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; same author list and (up to capitalization)
% same title as DBLP:conf/icassp/BahdanauCSBB16 in this file (presumably the
% published version -- confirm before citing both).
@article{DBLP:journals/corr/BahdanauCSBB15,
  author       = {Dzmitry Bahdanau and
                  Jan Chorowski and
                  Dmitriy Serdyuk and
                  Philemon Brakel and
                  Yoshua Bengio},
  title        = {End-to-End Attention-based Large Vocabulary Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1508.04395},
  year         = {2015},
  url          = {https://arxiv.org/abs/1508.04395},
  eprinttype   = {arXiv},
  eprint       = {1508.04395},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauCSBB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BahdanauSBKCCB15,
  author       = {Dzmitry Bahdanau and
                  Dmitriy Serdyuk and
                  Philemon Brakel and
                  Nan Rosemary Ke and
                  Jan Chorowski and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Task Loss Estimation for Sequence Prediction},
  journal      = {CoRR},
  volume       = {abs/1511.06456},
  year         = {2015},
  url          = {https://arxiv.org/abs/1511.06456},
  eprinttype   = {arXiv},
  eprint       = {1511.06456},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauSBKCCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChoMGBBSB14,
  author       = {Kyunghyun Cho and
                  Bart van Merri{\"{e}}nboer and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Dzmitry Bahdanau and
                  Fethi Bougares and
                  Holger Schwenk and
                  Yoshua Bengio},
  editor       = {Alessandro Moschitti and
                  Bo Pang and
                  Walter Daelemans},
  title        = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical
                  Machine Translation},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {1724--1734},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1179},
  doi          = {10.3115/V1/D14-1179},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChoMGBBSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssst/Pouget-AbadieBM14,
  author       = {Jean Pouget{-}Abadie and
                  Dzmitry Bahdanau and
                  Bart van Merri{\"{e}}nboer and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Dekai Wu and
                  Marine Carpuat and
                  Xavier Carreras and
                  Eva Maria Vecchi},
  title        = {Overcoming the Curse of Sentence Length for Neural Machine Translation
                  using Automatic Segmentation},
  booktitle    = {Proceedings of SSST@EMNLP 2014, Eighth Workshop on Syntax, Semantics
                  and Structure in Statistical Translation, Doha, Qatar, 25 October
                  2014},
  pages        = {78--85},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://aclanthology.org/W14-4009/},
  doi          = {10.3115/V1/W14-4009},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssst/Pouget-AbadieBM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssst/ChoMBB14,
  author       = {Kyunghyun Cho and
                  Bart van Merri{\"{e}}nboer and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  editor       = {Dekai Wu and
                  Marine Carpuat and
                  Xavier Carreras and
                  Eva Maria Vecchi},
  title        = {On the Properties of Neural Machine Translation: Encoder-Decoder Approaches},
  booktitle    = {Proceedings of SSST@EMNLP 2014, Eighth Workshop on Syntax, Semantics
                  and Structure in Statistical Translation, Doha, Qatar, 25 October
                  2014},
  pages        = {103--111},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://aclanthology.org/W14-4012/},
  doi          = {10.3115/V1/W14-4012},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssst/ChoMBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; shares title and authors with
% DBLP:conf/ssst/Pouget-AbadieBM14 in this file (presumably the published
% version -- confirm before citing both).
@article{DBLP:journals/corr/Pouget-AbadieBMCB14,
  author       = {Jean Pouget{-}Abadie and
                  Dzmitry Bahdanau and
                  Bart van Merri{\"{e}}nboer and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Overcoming the Curse of Sentence Length for Neural Machine Translation
                  using Automatic Segmentation},
  journal      = {CoRR},
  volume       = {abs/1409.1257},
  year         = {2014},
  url          = {https://arxiv.org/abs/1409.1257},
  eprinttype   = {arXiv},
  eprint       = {1409.1257},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Pouget-AbadieBMCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): arXiv record; shares title and authors with
% DBLP:conf/ssst/ChoMBB14 in this file (presumably the published
% version -- confirm before citing both).
@article{DBLP:journals/corr/ChoMBB14,
  author       = {Kyunghyun Cho and
                  Bart van Merri{\"{e}}nboer and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {On the Properties of Neural Machine Translation: Encoder-Decoder Approaches},
  journal      = {CoRR},
  volume       = {abs/1409.1259},
  year         = {2014},
  url          = {https://arxiv.org/abs/1409.1259},
  eprinttype   = {arXiv},
  eprint       = {1409.1259},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChoMBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChorowskiBCB14,
  author       = {Jan Chorowski and
                  Dzmitry Bahdanau and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {End-to-end Continuous Speech Recognition using Attention-based Recurrent
                  {NN:} First Results},
  journal      = {CoRR},
  volume       = {abs/1412.1602},
  year         = {2014},
  url          = {https://arxiv.org/abs/1412.1602},
  eprinttype   = {arXiv},
  eprint       = {1412.1602},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChorowskiBCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics