BibTeX records: Richard Socher

download as .bib file

% arXiv preprint (CoRR abs/2402.06196, 2024).
@article{DBLP:journals/corr/abs-2402-06196,
  author       = {Minaee, Shervin and
                  Mikolov, Tom{\'{a}}s and
                  Nikzad, Narjes and
                  Chenaghlu, Meysam and
                  Socher, Richard and
                  Amatriain, Xavier and
                  Gao, Jianfeng},
  title        = {Large Language Models: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2402.06196},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.06196},
  doi          = {10.48550/ARXIV.2402.06196},
  eprinttype   = {arXiv},
  eprint       = {2402.06196},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-06196.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (npj Digit. Medicine, vol. 6, 2023): author-correction notice.
@article{DBLP:journals/npjdm/EstevaFWHSDCSMS23,
  author       = {Esteva, Andre and
                  Feng, Jean and
                  van der Wal, Douwe and
                  Huang, Shih{-}Cheng and
                  Simko, Jeffry P. and
                  Devries, Sandy and
                  Chen, Emmalyn and
                  Schaeffer, Edward M. and
                  Morgan, Todd M. and
                  Sun, Yilun and
                  Ghorbani, Amirata and
                  Naik, Nikhil and
                  Nathawani, Dhruv and
                  Socher, Richard and
                  Michalski, Jeff M. and
                  Roach, Mack and
                  Pisansky, Thomas M. and
                  Monson, Jedidiah M. and
                  Naz, Farah and
                  Wallace, James and
                  Ferguson, Michelle J. and
                  Bahary, Jean{-}Paul and
                  Zou, James and
                  Lungren, Matthew P. and
                  Yeung, Serena and
                  Ross, Ashley E. and
                  Kucharczyk, Michael J. and
                  Souhami, Luis and
                  Ballas, Leslie and
                  Peters, Christopher A. and
                  Liu, Sandy and
                  Balogh, Alexander G. and
                  Randolph{-}Jackson, Pamela D. and
                  Schwartz, David L. and
                  Girvigian, Michael R. and
                  Saito, Naoyuki G. and
                  Raben, Adam and
                  Rabinovitch, Rachel A. and
                  Katato, Khalil and
                  Sandler, Howard M. and
                  Tran, Phuoc T. and
                  Spratt, Daniel E. and
                  Pugh, Stephanie and
                  Feng, Felix Y. and
                  Mohamad, Osama},
  title        = {Author Correction: Prostate cancer therapy personalization via multi-modal
                  deep learning on randomized phase {III} clinical trials},
  journal      = {npj Digit. Medicine},
  volume       = {6},
  year         = {2023},
  url          = {https://doi.org/10.1038/s41746-023-00769-z},
  doi          = {10.1038/S41746-023-00769-Z},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npjdm/EstevaFWHSDCSMS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (npj Digit. Medicine, vol. 5, 2022).
@article{DBLP:journals/npjdm/EstevaFWHSDCSMS22,
  author       = {Esteva, Andre and
                  Feng, Jean and
                  van der Wal, Douwe and
                  Huang, Shih{-}Cheng and
                  Simko, Jeffry P. and
                  Devries, Sandy and
                  Chen, Emmalyn and
                  Schaeffer, Edward M. and
                  Morgan, Todd M. and
                  Sun, Yilun and
                  Ghorbani, Amirata and
                  Naik, Nikhil and
                  Nathawani, Dhruv and
                  Socher, Richard and
                  Michalski, Jeff M. and
                  Roach, Mack and
                  Pisansky, Thomas M. and
                  Monson, Jedidiah M. and
                  Naz, Farah and
                  Wallace, James and
                  Ferguson, Michelle J. and
                  Bahary, Jean{-}Paul and
                  Zou, James and
                  Lungren, Matthew P. and
                  Yeung, Serena and
                  Ross, Ashley E. and
                  Kucharczyk, Michael J. and
                  Souhami, Luis and
                  Ballas, Leslie and
                  Peters, Christopher A. and
                  Liu, Sandy and
                  Balogh, Alexander G. and
                  Randolph{-}Jackson, Pamela D. and
                  Schwartz, David L. and
                  Girvigian, Michael R. and
                  Saito, Naoyuki G. and
                  Raben, Adam and
                  Rabinovitch, Rachel A. and
                  Katato, Khalil and
                  Sandler, Howard M. and
                  Tran, Phuoc T. and
                  Spratt, Daniel E. and
                  Pugh, Stephanie and
                  Feng, Felix Y. and
                  Mohamad, Osama},
  title        = {Prostate cancer therapy personalization via multi-modal deep learning
                  on randomized phase {III} clinical trials},
  journal      = {npj Digit. Medicine},
  volume       = {5},
  year         = {2022},
  url          = {https://doi.org/10.1038/s41746-022-00613-w},
  doi          = {10.1038/S41746-022-00613-W},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npjdm/EstevaFWHSDCSMS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2203.12187, 2022).
@article{DBLP:journals/corr/abs-2203-12187,
  author       = {Xie, Tian and
                  Yang, Xinyi and
                  Lin, Angela S. and
                  Wu, Feihong and
                  Hashimoto, Kazuma and
                  Qu, Jin and
                  Kang, Young Mo and
                  Yin, Wenpeng and
                  Wang, Huan and
                  Yavuz, Semih and
                  Wu, Gang and
                  Jones, Michael and
                  Socher, Richard and
                  Zhou, Yingbo and
                  Liu, Wenhao and
                  Xiong, Caiming},
  title        = {Converse: {A} Tree-Based Modular Task-Oriented Dialogue System},
  journal      = {CoRR},
  volume       = {abs/2203.12187},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.12187},
  doi          = {10.48550/ARXIV.2203.12187},
  eprinttype   = {arXiv},
  eprint       = {2203.12187},
  timestamp    = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-12187.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (npj Digit. Medicine, vol. 4, 2021).
@article{DBLP:journals/npjdm/EstevaCYNMM0TDS21,
  author       = {Esteva, Andre and
                  Chou, Katherine and
                  Yeung, Serena and
                  Naik, Nikhil and
                  Madani, Ali and
                  Mottaghi, Ali and
                  Liu, Yun and
                  Topol, Eric J. and
                  Dean, Jeff and
                  Socher, Richard},
  title        = {Deep learning-enabled medical computer vision},
  journal      = {npj Digit. Medicine},
  volume       = {4},
  year         = {2021},
  url          = {https://doi.org/10.1038/s41746-020-00376-2},
  doi          = {10.1038/S41746-020-00376-2},
  timestamp    = {Wed, 01 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/npjdm/EstevaCYNMM0TDS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (npj Digit. Medicine, vol. 4, 2021).
@article{DBLP:journals/npjdm/EstevaKPH0RS21,
  author       = {Esteva, Andre and
                  Kale, Anuprit and
                  Paulus, Romain and
                  Hashimoto, Kazuma and
                  Yin, Wenpeng and
                  Radev, Dragomir and
                  Socher, Richard},
  title        = {{COVID-19} information retrieval with deep-learning based semantic
                  search, question answering, and abstractive summarization},
  journal      = {npj Digit. Medicine},
  volume       = {4},
  year         = {2021},
  url          = {https://doi.org/10.1038/s41746-021-00437-0},
  doi          = {10.1038/S41746-021-00437-0},
  timestamp    = {Mon, 01 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npjdm/EstevaKPH0RS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (npj Digit. Medicine, vol. 4, 2021).
% The acronym {AI} is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/npjdm/WalJLNRRTW0FMSS21,
  author       = {van der Wal, Douwe and
                  Jhun, Iny and
                  Laklouk, Israa and
                  Nirschl, Jeffrey J. and
                  Richer, Lara and
                  Rojansky, Rebecca and
                  Theparee, Talent and
                  Wheeler, Joshua and
                  Sander, J{\"{o}}rg and
                  Feng, Felix Y. and
                  Mohamad, Osama and
                  Savarese, Silvio and
                  Socher, Richard and
                  Esteva, Andre},
  title        = {Biological data annotation via a human-augmenting {AI}-based labeling
                  system},
  journal      = {npj Digit. Medicine},
  volume       = {4},
  year         = {2021},
  url          = {https://doi.org/10.1038/s41746-021-00520-6},
  doi          = {10.1038/S41746-021-00520-6},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npjdm/WalJLNRRTW0FMSS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Trans. Assoc. Comput. Linguistics, vol. 9, 2021).
% {SummEval} is brace-protected so sentence-casing styles keep its mixed capitalisation.
@article{DBLP:journals/tacl/FabbriKMXSR21,
  author       = {Fabbri, Alexander R. and
                  Kryscinski, Wojciech and
                  McCann, Bryan and
                  Xiong, Caiming and
                  Socher, Richard and
                  Radev, Dragomir R.},
  title        = {{SummEval}: Re-evaluating Summarization Evaluation},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {9},
  pages        = {391--409},
  year         = {2021},
  url          = {https://doi.org/10.1162/tacl\_a\_00373},
  doi          = {10.1162/TACL\_A\_00373},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/FabbriKMXSR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (CVPR 2021).
@inproceedings{DBLP:conf/cvpr/GaoZXSX21,
  author       = {Gao, Mingfei and
                  Zhou, Yingbo and
                  Xu, Ran and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {{WOAD:} Weakly Supervised Online Action Detection in Untrimmed Videos},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2021, virtual, June 19-25, 2021},
  pages        = {1915--1923},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021/html/Gao\_WOAD\_Weakly\_Supervised\_Online\_Action\_Detection\_in\_Untrimmed\_Videos\_CVPR\_2021\_paper.html},
  doi          = {10.1109/CVPR46437.2021.00195},
  timestamp    = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/GaoZXSX21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (Findings of ACL: EMNLP 2021).
% {GeDi} is brace-protected so sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/emnlp/KrauseGMKJSR21,
  author       = {Krause, Ben and
                  Gotmare, Akhilesh Deepak and
                  McCann, Bryan and
                  Keskar, Nitish Shirish and
                  Joty, Shafiq R. and
                  Socher, Richard and
                  Rajani, Nazneen Fatema},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {{GeDi}: Generative Discriminator Guided Sequence Generation},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November,
                  2021},
  pages        = {4929--4952},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.findings-emnlp.424},
  doi          = {10.18653/V1/2021.FINDINGS-EMNLP.424},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/KrauseGMKJSR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ICLR 2021).
% {GraPPa} is brace-protected so sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/iclr/0009WLWTYRSX21,
  author       = {Yu, Tao and
                  Wu, Chien{-}Sheng and
                  Lin, Xi Victoria and
                  Wang, Bailin and
                  Tan, Yi Chern and
                  Yang, Xinyi and
                  Radev, Dragomir R. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {{GraPPa}: Grammar-Augmented Pre-Training for Table Semantic Parsing},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=kyaIeYj4zZ},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/0009WLWTYRSX21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ICLR 2021).
% {BERTology} is brace-protected so sentence-casing styles do not reduce it to "Bertology".
@inproceedings{DBLP:conf/iclr/VigMVXSR21,
  author       = {Vig, Jesse and
                  Madani, Ali and
                  Varshney, Lav R. and
                  Xiong, Caiming and
                  Socher, Richard and
                  Rajani, Nazneen Fatema},
  title        = {{BERTology} Meets Biology: Interpreting Attention in Protein Language
                  Models},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=YWtLZvLmud7},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/VigMVXSR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ICML 2021, PMLR vol. 139).
% The proper noun {Fisher} is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/icml/JastrzebskiAAKW21,
  author       = {Jastrzebski, Stanislaw and
                  Arpit, Devansh and
                  {\AA}strand, Oliver and
                  Kerg, Giancarlo and
                  Wang, Huan and
                  Xiong, Caiming and
                  Socher, Richard and
                  Cho, Kyunghyun and
                  Geras, Krzysztof J.},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Catastrophic {Fisher} Explosion: Early Phase {Fisher} Matrix Impacts Generalization},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {4772--4784},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/jastrzebski21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/JastrzebskiAAKW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (NAACL-HLT 2021).
@inproceedings{DBLP:conf/naacl/NanRZRSHTVVKLIP21,
  author       = {Nan, Linyong and
                  Radev, Dragomir R. and
                  Zhang, Rui and
                  Rau, Amrit and
                  Sivaprasad, Abhinand and
                  Hsieh, Chiachun and
                  Tang, Xiangru and
                  Vyas, Aadit and
                  Verma, Neha and
                  Krishna, Pranav and
                  Liu, Yangxiaokang and
                  Irwanto, Nadia and
                  Pan, Jessica and
                  Rahman, Faiaz and
                  Zaidi, Ahmad and
                  Mutuma, Mutethia and
                  Tarabar, Yasin and
                  Gupta, Ankit and
                  Yu, Tao and
                  Tan, Yi Chern and
                  Lin, Xi Victoria and
                  Xiong, Caiming and
                  Socher, Richard and
                  Rajani, Nazneen Fatema},
  editor       = {Toutanova, Kristina and
                  Rumshisky, Anna and
                  Zettlemoyer, Luke and
                  Hakkani{-}T{\"{u}}r, Dilek and
                  Beltagy, Iz and
                  Bethard, Steven and
                  Cotterell, Ryan and
                  Chakraborty, Tanmoy and
                  Zhou, Yichao},
  title        = {{DART:} Open-Domain Structured Data Record to Text Generation},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  pages        = {432--447},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.37},
  doi          = {10.18653/V1/2021.NAACL-MAIN.37},
  timestamp    = {Fri, 06 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/NanRZRSHTVVKLIP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (NeurIPS 2021).
% The proper noun {Bayes} is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/nips/TheisenWVXS21,
  author       = {Theisen, Ryan and
                  Wang, Huan and
                  Varshney, Lav R. and
                  Xiong, Caiming and
                  Socher, Richard},
  editor       = {Ranzato, Marc'Aurelio and
                  Beygelzimer, Alina and
                  Dauphin, Yann N. and
                  Liang, Percy and
                  Vaughan, Jennifer Wortman},
  title        = {Evaluating State-of-the-Art Classification Models Against {Bayes} Optimality},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {9367--9377},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/4e0ccd2b894f717df5ebc12f4282ee70-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/TheisenWVXS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2106.03357, 2021).
% The proper noun {Bayes} is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2106-03357,
  author       = {Theisen, Ryan and
                  Wang, Huan and
                  Varshney, Lav R. and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Evaluating State-of-the-Art Classification Models Against {Bayes} Optimality},
  journal      = {CoRR},
  volume       = {abs/2106.03357},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.03357},
  eprinttype   = {arXiv},
  eprint       = {2106.03357},
  timestamp    = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-03357.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2108.02755, 2021).
@article{DBLP:journals/corr/abs-2108-02755,
  author       = {Zheng, Stephan and
                  Trott, Alexander and
                  Srinivasa, Sunil and
                  Parkes, David C. and
                  Socher, Richard},
  title        = {The {AI} Economist: Optimal Economic Policy Design via Two-level Deep
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2108.02755},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.02755},
  eprinttype   = {arXiv},
  eprint       = {2108.02755},
  timestamp    = {Wed, 11 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-02755.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ACL 2020, System Demonstrations).
% The acronym {SQL} is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/acl/ZengLHSXLK20,
  author       = {Zeng, Jichuan and
                  Lin, Xi Victoria and
                  Hoi, Steven C. H. and
                  Socher, Richard and
                  Xiong, Caiming and
                  Lyu, Michael R. and
                  King, Irwin},
  editor       = {Celikyilmaz, Asli and
                  Wen, Tsung{-}Hsien},
  title        = {Photon: {A} Robust Cross-Domain Text-to-{SQL} System},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics: System Demonstrations, {ACL} 2020, Online, July 5-10,
                  2020},
  pages        = {204--214},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-demos.24},
  doi          = {10.18653/V1/2020.ACL-DEMOS.24},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZengLHSXLK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ACL 2020).
@inproceedings{DBLP:conf/acl/GaoWJXSKLH20,
  author       = {Gao, Yifan and
                  Wu, Chien{-}Sheng and
                  Joty, Shafiq R. and
                  Xiong, Caiming and
                  Socher, Richard and
                  King, Irwin and
                  Lyu, Michael R. and
                  Hoi, Steven C. H.},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {Explicit Memory Tracker with Coarse-to-Fine Reasoning for Conversational
                  Machine Reading},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {935--945},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.88},
  doi          = {10.18653/V1/2020.ACL-MAIN.88},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/GaoWJXSKLH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ACL 2020).
@inproceedings{DBLP:conf/acl/TanJKS20,
  author       = {Tan, Samson and
                  Joty, Shafiq R. and
                  Kan, Min{-}Yen and
                  Socher, Richard},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {It's Morphin' Time! Combating Linguistic Discrimination with Inflectional
                  Perturbations},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {2920--2935},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.263},
  doi          = {10.18653/V1/2020.ACL-MAIN.263},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/TanJKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ACL 2020).
@inproceedings{DBLP:conf/acl/DeYoungJRLXSW20,
  author       = {DeYoung, Jay and
                  Jain, Sarthak and
                  Rajani, Nazneen Fatema and
                  Lehman, Eric and
                  Xiong, Caiming and
                  Socher, Richard and
                  Wallace, Byron C.},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {{ERASER:} {A} Benchmark to Evaluate Rationalized {NLP} Models},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {4443--4458},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.408},
  doi          = {10.18653/V1/2020.ACL-MAIN.408},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DeYoungJRLXSW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (ACL 2020).
@inproceedings{DBLP:conf/acl/RajaniZTZWVGXSR20,
  author       = {Rajani, Nazneen Fatema and
                  Zhang, Rui and
                  Tan, Yi Chern and
                  Zheng, Stephan and
                  Weiss, Jeremy and
                  Vyas, Aadit and
                  Gupta, Abhijit and
                  Xiong, Caiming and
                  Socher, Richard and
                  Radev, Dragomir R.},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {{ESPRIT:} Explaining Solutions to Physical Reasoning Tasks},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {7906--7917},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.706},
  doi          = {10.18653/V1/2020.ACL-MAIN.706},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RajaniZTZWVGXSR20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (AISTATS 2020, PMLR vol. 108).
@inproceedings{DBLP:conf/aistats/WangKXS20,
  author       = {Wang, Huan and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  editor       = {Chiappa, Silvia and
                  Calandra, Roberto},
  title        = {Assessing Local Generalization Capability in Deep Models},
  booktitle    = {The 23rd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series       = {Proceedings of Machine Learning Research},
  volume       = {108},
  pages        = {2077--2087},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v108/wang20f.html},
  timestamp    = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/WangKXS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (CVPR 2020).
@inproceedings{DBLP:conf/cvpr/LiWZXSD20,
  author       = {Li, Hengduo and
                  Wu, Zuxuan and
                  Zhu, Chen and
                  Xiong, Caiming and
                  Socher, Richard and
                  Davis, Larry S.},
  title        = {Learning From Noisy Anchors for One-Stage Object Detection},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {10585--10594},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Li\_Learning\_From\_Noisy\_Anchors\_for\_One-Stage\_Object\_Detection\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01060},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/LiWZXSD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (EMNLP 2020).
@inproceedings{DBLP:conf/emnlp/WuHSX20,
  author       = {Wu, Chien{-}Sheng and
                  Hoi, Steven C. H. and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {{TOD-BERT:} Pre-trained Natural Language Understanding for Task-Oriented
                  Dialogue},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {917--929},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.66},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.66},
  timestamp    = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/WuHSX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (Findings of ACL: EMNLP 2020).
@inproceedings{DBLP:conf/emnlp/XiaXYS20,
  author       = {Xia, Congying and
                  Xiong, Caiming and
                  Yu, Philip S. and
                  Socher, Richard},
  editor       = {Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Composed Variational Natural Language Generation for Few-shot Intents},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2020, Online Event, 16-20 November 2020},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {3379--3388},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.findings-emnlp.303},
  doi          = {10.18653/V1/2020.FINDINGS-EMNLP.303},
  timestamp    = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/XiaXYS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (Findings of ACL: EMNLP 2020).
% The acronym {SQL} is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/emnlp/LinSX20,
  author       = {Lin, Xi Victoria and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Bridging Textual and Tabular Data for Cross-Domain Text-to-{SQL} Semantic
                  Parsing},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2020, Online Event, 16-20 November 2020},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {4870--4888},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.findings-emnlp.438},
  doi          = {10.18653/V1/2020.FINDINGS-EMNLP.438},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LinSX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper (EMNLP 2020).
@inproceedings{DBLP:conf/emnlp/ZhangHLWWYSX20,
  author       = {Zhang, Jian{-}Guo and
                  Hashimoto, Kazuma and
                  Liu, Wenhao and
                  Wu, Chien{-}Sheng and
                  Wan, Yao and
                  Yu, Philip S. and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Discriminative Nearest Neighbor Few-Shot Intent Detection by Transferring
                  Natural Language Inference},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {5064--5082},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.411},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.411},
  timestamp    = {Tue, 13 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhangHLWWYSX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2020 proceedings paper on data augmentation for dialog act tagging.
@inproceedings{DBLP:conf/emnlp/YavuzHLKSX20,
  author    = {Yavuz, Semih and
               Hashimoto, Kazuma and
               Liu, Wenhao and
               Keskar, Nitish Shirish and
               Socher, Richard and
               Xiong, Caiming},
  editor    = {Webber, Bonnie and
               Cohn, Trevor and
               He, Yulan and
               Liu, Yang},
  title     = {Simple Data Augmentation with the Mask Token Improves Domain Adaptation for Dialog Act Tagging},
  booktitle = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages     = {5083--5089},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.412},
  doi       = {10.18653/V1/2020.EMNLP-MAIN.412},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/YavuzHLKSX20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 proceedings paper. Sesame Street and APIs are brace-protected in the
% title so that sentence-casing bibliography styles keep their capitals.
@inproceedings{DBLP:conf/emnlp/KeskarMXS20,
  author       = {Nitish Shirish Keskar and
                  Bryan McCann and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {Bonnie Webber and
                  Trevor Cohn and
                  Yulan He and
                  Yang Liu},
  title        = {The Thieves on {Sesame Street} are Polyglots - Extracting Multilingual
                  Models from Monolingual {APIs}},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {6203--6207},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.501},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.501},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/KeskarMXS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 proceedings paper on few-shot textual entailment.
@inproceedings{DBLP:conf/emnlp/YinRRSX20,
  author    = {Yin, Wenpeng and
               Rajani, Nazneen Fatema and
               Radev, Dragomir R. and
               Socher, Richard and
               Xiong, Caiming},
  editor    = {Webber, Bonnie and
               Cohn, Trevor and
               He, Yulan and
               Liu, Yang},
  title     = {Universal Natural Language Processing with Limited Annotations: Try Few-shot Textual Entailment as a Start},
  booktitle = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages     = {8229--8239},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.660},
  doi       = {10.18653/V1/2020.EMNLP-MAIN.660},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/YinRRSX20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 proceedings paper on factual consistency of abstractive summaries.
@inproceedings{DBLP:conf/emnlp/KryscinskiMXS20,
  author    = {Kryscinski, Wojciech and
               McCann, Bryan and
               Xiong, Caiming and
               Socher, Richard},
  editor    = {Webber, Bonnie and
               Cohn, Trevor and
               He, Yulan and
               Liu, Yang},
  title     = {Evaluating the Factual Consistency of Abstractive Text Summarization},
  booktitle = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages     = {9332--9346},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.emnlp-main.750},
  doi       = {10.18653/V1/2020.EMNLP-MAIN.750},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/KryscinskiMXS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. Wikipedia is brace-protected in the title so that
% sentence-casing bibliography styles do not lower-case the proper noun.
@inproceedings{DBLP:conf/iclr/AsaiHHSX20,
  author       = {Akari Asai and
                  Kazuma Hashimoto and
                  Hannaneh Hajishirzi and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Learning to Retrieve Reasoning Paths over {Wikipedia} Graph for Question
                  Answering},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=SJgVHkrYDH},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AsaiHHSX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper; same title and authors as DBLP:journals/corr/abs-2002-08024.
% The url field stores the raw address with a plain underscore, because
% url-aware styles and biblatex/Biber treat this field verbatim.
@inproceedings{DBLP:conf/iclr/LeSH20,
  author       = {Hung Le and
                  Richard Socher and
                  Steven C. H. Hoi},
  title        = {Non-Autoregressive Dialog State Tracking},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=H1e_cC4twS},
  timestamp    = {Thu, 07 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LeSH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper; same title and authors as DBLP:journals/corr/abs-2002-07394.
% DivideMix is brace-protected so sentence-casing styles keep its inner capital.
@inproceedings{DBLP:conf/iclr/LiSH20,
  author       = {Junnan Li and
                  Richard Socher and
                  Steven C. H. Hoi},
  title        = {{DivideMix}: Learning with Noisy Labels as Semi-supervised Learning},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=HJgExaVtwr},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/LiSH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper; DBLP:journals/corr/abs-2002-08046 lists the same authors and
% the same title apart from capitalisation.
@inproceedings{DBLP:conf/iclr/NguyenJHS20,
  author    = {Nguyen, Xuan{-}Phi and
               Joty, Shafiq R. and
               Hoi, Steven C. H. and
               Socher, Richard},
  title     = {Tree-Structured Attention with Hierarchical Accumulation},
  booktitle = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher = {OpenReview.net},
  year      = {2020},
  url       = {https://openreview.net/forum?id=HJxK5pEYvr},
  timestamp = {Fri, 17 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/NguyenJHS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper (PMLR volume 119); same title as DBLP:journals/corr/abs-2002-03647,
% which spells the first author's given name with an accent.
% The url uses https instead of plain http.
@inproceedings{DBLP:conf/icml/CamposTXSGT20,
  author       = {Victor Campos and
                  Alexander Trott and
                  Caiming Xiong and
                  Richard Socher and
                  Xavier Gir{\'{o}}{-}i{-}Nieto and
                  Jordi Torres},
  title        = {Explore, Discover and Learn: Unsupervised Discovery of State-Covering
                  Skills},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {1317--1327},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/campos20a.html},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/CamposTXSGT20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper on phone-based subword units for speech recognition.
@inproceedings{DBLP:conf/interspeech/WangWBZXS20,
  author    = {Wang, Weiran and
               Wang, Guangsen and
               Bhatnagar, Aadyot and
               Zhou, Yingbo and
               Xiong, Caiming and
               Socher, Richard},
  editor    = {Meng, Helen and
               Xu, Bo and
               Zheng, Thomas Fang},
  title     = {An Investigation of Phone-Based Subword Units for End-to-End Speech Recognition},
  booktitle = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages     = {1778--1782},
  publisher = {{ISCA}},
  year      = {2020},
  url       = {https://doi.org/10.21437/Interspeech.2020-1873},
  doi       = {10.21437/INTERSPEECH.2020-1873},
  timestamp = {Fri, 29 Jan 2021 17:40:16 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/WangWBZXS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ITA 2020 workshop paper; same title and authors as DBLP:journals/corr/abs-2002-03438.
@inproceedings{DBLP:conf/ita/VarshneyKS20,
  author    = {Varshney, Lav R. and
               Keskar, Nitish Shirish and
               Socher, Richard},
  title     = {Limits of Detecting Text Generated by Large-Scale Language Models},
  booktitle = {Information Theory and Applications Workshop, {ITA} 2020, San Diego, CA, USA, February 2-7, 2020},
  pages     = {1--5},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/ITA50056.2020.9245012},
  doi       = {10.1109/ITA50056.2020.9245012},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ita/VarshneyKS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; same title and authors as DBLP:journals/corr/abs-2006-13436.
@inproceedings{DBLP:conf/nips/ChenBLZWXS20,
  author    = {Chen, Minshuo and
               Bai, Yu and
               Lee, Jason D. and
               Zhao, Tuo and
               Wang, Huan and
               Xiong, Caiming and
               Socher, Richard},
  editor    = {Larochelle, Hugo and
               Ranzato, Marc'Aurelio and
               Hadsell, Raia and
               Balcan, Maria{-}Florina and
               Lin, Hsuan{-}Tien},
  title     = {Towards Understanding Hierarchical Learning: Benefits of Neural Representations},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/fb647ca6672b0930e9d00dc384d8b16f-Abstract.html},
  timestamp = {Sat, 15 Apr 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/ChenBLZWXS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; same title and authors as DBLP:journals/corr/abs-2005-00796.
@inproceedings{DBLP:conf/nips/Hosseini-AslMWY20,
  author    = {Hosseini{-}Asl, Ehsan and
               McCann, Bryan and
               Wu, Chien{-}Sheng and
               Yavuz, Semih and
               Socher, Richard},
  editor    = {Larochelle, Hugo and
               Ranzato, Marc'Aurelio and
               Hadsell, Raia and
               Balcan, Maria{-}Florina and
               Lin, Hsuan{-}Tien},
  title     = {A Simple Language Model for Task-Oriented Dialogue},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/e946209592563be0f01c844ab2170f0c-Abstract.html},
  timestamp = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/Hosseini-AslMWY20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper on online structured meta-learning.
@inproceedings{DBLP:conf/nips/YaoZMLSX20,
  author    = {Yao, Huaxiu and
               Zhou, Yingbo and
               Mahdavi, Mehrdad and
               Li, Zhenhui and
               Socher, Richard and
               Xiong, Caiming},
  editor    = {Larochelle, Hugo and
               Ranzato, Marc'Aurelio and
               Hadsell, Raia and
               Balcan, Maria{-}Florina and
               Lin, Hsuan{-}Tien},
  title     = {Online Structured Meta-learning},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/4b86ca48d90bd5f0978afa3a012503a4-Abstract.html},
  timestamp = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/YaoZMLSX20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; same title as DBLP:journals/corr/abs-2006-16537, where the
% last author's given names appear as initials.
@inproceedings{DBLP:conf/nips/ZhouXSH20,
  author    = {Zhou, Pan and
               Xiong, Caiming and
               Socher, Richard and
               Hoi, Steven Chu{-}Hong},
  editor    = {Larochelle, Hugo and
               Ranzato, Marc'Aurelio and
               Hadsell, Raia and
               Balcan, Maria{-}Florina and
               Lin, Hsuan{-}Tien},
  title     = {Theory-Inspired Path-Regularized Differential Network Architecture Search},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/5e1b18c4c6a6d31695acbae3fd70ecc6-Abstract.html},
  timestamp = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/ZhouXSH20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% *SEM 2020 paper on slot-value prediction for multi-domain dialog state tracking.
@inproceedings{DBLP:conf/starsem/ZhangHWWYSX20,
  author    = {Zhang, Jian{-}Guo and
               Hashimoto, Kazuma and
               Wu, Chien{-}Sheng and
               Wan, Yao and
               Yu, Philip S. and
               Socher, Richard and
               Xiong, Caiming},
  editor    = {Gurevych, Iryna and
               Apidianaki, Marianna and
               Faruqui, Manaal},
  title     = {Find or Classify? Dual Strategy for Slot-Value Predictions on Multi-Domain Dialog State Tracking},
  booktitle = {Proceedings of the Ninth Joint Conference on Lexical and Computational Semantics, *SEM@COLING 2020, Barcelona, Spain (Online), December 12-13, 2020},
  pages     = {154--167},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://aclanthology.org/2020.starsem-1.17/},
  timestamp = {Thu, 08 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/starsem/ZhangHWWYSX20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.03438; same title and authors as DBLP:conf/ita/VarshneyKS20.
@article{DBLP:journals/corr/abs-2002-03438,
  author     = {Varshney, Lav R. and
                Keskar, Nitish Shirish and
                Socher, Richard},
  title      = {Limits of Detecting Text Generated by Large-Scale Language Models},
  journal    = {CoRR},
  volume     = {abs/2002.03438},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.03438},
  eprinttype = {arXiv},
  eprint     = {2002.03438},
  timestamp  = {Wed, 12 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-03438.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.03647; same title as DBLP:conf/icml/CamposTXSGT20, which
% spells the first author's given name without the accent.
@article{DBLP:journals/corr/abs-2002-03647,
  author     = {Campos, V{\'{\i}}ctor and
                Trott, Alexander and
                Xiong, Caiming and
                Socher, Richard and
                Gir{\'{o}}{-}i{-}Nieto, Xavier and
                Torres, Jordi},
  title      = {Explore, Discover and Learn: Unsupervised Discovery of State-Covering Skills},
  journal    = {CoRR},
  volume     = {abs/2002.03647},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.03647},
  eprinttype = {arXiv},
  eprint     = {2002.03647},
  timestamp  = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-03647.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.04010.
@article{DBLP:journals/corr/abs-2002-04010,
  author     = {Bai, Yu and
                Krause, Ben and
                Wang, Huan and
                Xiong, Caiming and
                Socher, Richard},
  title      = {Taylorized Training: Towards Better Approximation of Neural Network Training at Finite Width},
  journal    = {CoRR},
  volume     = {abs/2002.04010},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.04010},
  eprinttype = {arXiv},
  eprint     = {2002.04010},
  timestamp  = {Sat, 15 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-04010.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.07394; same title and authors as DBLP:conf/iclr/LiSH20.
% DivideMix is brace-protected so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2002-07394,
  author       = {Junnan Li and
                  Richard Socher and
                  Steven C. H. Hoi},
  title        = {{DivideMix}: Learning with Noisy Labels as Semi-supervised Learning},
  journal      = {CoRR},
  volume       = {abs/2002.07394},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.07394},
  eprinttype   = {arXiv},
  eprint       = {2002.07394},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-07394.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.08024; same title and authors as DBLP:conf/iclr/LeSH20.
@article{DBLP:journals/corr/abs-2002-08024,
  author     = {Le, Hung and
                Socher, Richard and
                Hoi, Steven C. H.},
  title      = {Non-Autoregressive Dialog State Tracking},
  journal    = {CoRR},
  volume     = {abs/2002.08024},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.08024},
  eprinttype = {arXiv},
  eprint     = {2002.08024},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-08024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.08046; DBLP:conf/iclr/NguyenJHS20 lists the same authors
% and the same title apart from capitalisation.
@article{DBLP:journals/corr/abs-2002-08046,
  author     = {Nguyen, Xuan{-}Phi and
                Joty, Shafiq R. and
                Hoi, Steven C. H. and
                Socher, Richard},
  title      = {Tree-structured Attention with Hierarchical Accumulation},
  journal    = {CoRR},
  volume     = {abs/2002.08046},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.08046},
  eprinttype = {arXiv},
  eprint     = {2002.08046},
  timestamp  = {Fri, 17 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-08046.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.09046. Bayes is brace-protected in the title so that
% sentence-casing bibliography styles do not lower-case the proper noun.
@article{DBLP:journals/corr/abs-2002-09046,
  author       = {Devansh Arpit and
                  Huan Wang and
                  Caiming Xiong and
                  Richard Socher and
                  Yoshua Bengio},
  title        = {Neural {Bayes}: {A} Generic Parameterization Method for Unsupervised
                  Representation Learning},
  journal      = {CoRR},
  volume       = {abs/2002.09046},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.09046},
  eprinttype   = {arXiv},
  eprint       = {2002.09046},
  timestamp    = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-09046.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.01285.
@article{DBLP:journals/corr/abs-2003-01285,
  author     = {Li, Junnan and
                Xiong, Caiming and
                Socher, Richard and
                Hoi, Steven C. H.},
  title      = {Towards Noise-resistant Object Detection with Noisy Annotations},
  journal    = {CoRR},
  volume     = {abs/2003.01285},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.01285},
  eprinttype = {arXiv},
  eprint     = {2003.01285},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-01285.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.13525.
@article{DBLP:journals/corr/abs-2003-13525,
  author     = {Albuquerque, Isabela and
                Naik, Nikhil and
                Li, Junnan and
                Keskar, Nitish Shirish and
                Socher, Richard},
  title      = {Improving out-of-distribution generalization via multi-task self-supervised pretraining},
  journal    = {CoRR},
  volume     = {abs/2003.13525},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.13525},
  eprinttype = {arXiv},
  eprint     = {2003.13525},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-13525.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.03497. ProGen is brace-protected in the title so that
% sentence-casing bibliography styles keep its inner capital.
@article{DBLP:journals/corr/abs-2004-03497,
  author       = {Ali Madani and
                  Bryan McCann and
                  Nikhil Naik and
                  Nitish Shirish Keskar and
                  Namrata Anand and
                  Raphael R. Eguchi and
                  Po{-}Ssu Huang and
                  Richard Socher},
  title        = {{ProGen}: Language Modeling for Protein Generation},
  journal      = {CoRR},
  volume       = {abs/2004.03497},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.03497},
  eprinttype   = {arXiv},
  eprint       = {2004.03497},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-03497.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.06871. ToD-BERT is brace-protected in the title so that
% sentence-casing bibliography styles keep the model name's capitalisation.
@article{DBLP:journals/corr/abs-2004-06871,
  author       = {Chien{-}Sheng Wu and
                  Steven C. H. Hoi and
                  Richard Socher and
                  Caiming Xiong},
  title        = {{ToD-BERT}: Pre-trained Natural Language Understanding for Task-Oriented
                  Dialogues},
  journal      = {CoRR},
  volume       = {abs/2004.06871},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.06871},
  eprinttype   = {arXiv},
  eprint       = {2004.06871},
  timestamp    = {Tue, 21 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-06871.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.13332. Both occurrences of the acronym AI in the title are
% brace-protected so sentence-casing styles do not lower-case the second one.
@article{DBLP:journals/corr/abs-2004-13332,
  author       = {Stephan Zheng and
                  Alexander Trott and
                  Sunil Srinivasa and
                  Nikhil Naik and
                  Melvin Gruesbeck and
                  David C. Parkes and
                  Richard Socher},
  title        = {The {AI} Economist: Improving Equality and Productivity with {AI}-Driven
                  Tax Policies},
  journal      = {CoRR},
  volume       = {abs/2004.13332},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.13332},
  eprinttype   = {arXiv},
  eprint       = {2004.13332},
  timestamp    = {Sun, 03 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-13332.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.00730.
@article{DBLP:journals/corr/abs-2005-00730,
  author     = {Rajani, Nazneen Fatema and
                Zhang, Rui and
                Tan, Yi Chern and
                Zheng, Stephan and
                Weiss, Jeremy and
                Vyas, Aadit and
                Gupta, Abhijit and
                Xiong, Caiming and
                Socher, Richard and
                Radev, Dragomir R.},
  title      = {{ESPRIT:} Explaining Solutions to Physical Reasoning Tasks},
  journal    = {CoRR},
  volume     = {abs/2005.00730},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.00730},
  eprinttype = {arXiv},
  eprint     = {2005.00730},
  timestamp  = {Fri, 08 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-00730.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.00796; same title and authors as DBLP:conf/nips/Hosseini-AslMWY20.
@article{DBLP:journals/corr/abs-2005-00796,
  author     = {Hosseini{-}Asl, Ehsan and
                McCann, Bryan and
                Wu, Chien{-}Sheng and
                Yavuz, Semih and
                Socher, Richard},
  title      = {A Simple Language Model for Task-Oriented Dialogue},
  journal    = {CoRR},
  volume     = {abs/2005.00796},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.00796},
  eprinttype = {arXiv},
  eprint     = {2005.00796},
  timestamp  = {Fri, 08 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-00796.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.04364.
@article{DBLP:journals/corr/abs-2005-04364,
  author     = {Tan, Samson and
                Joty, Shafiq R. and
                Kan, Min{-}Yen and
                Socher, Richard},
  title      = {It's Morphin' Time! Combating Linguistic Discrimination with Inflectional Perturbations},
  journal    = {CoRR},
  volume     = {abs/2005.04364},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.04364},
  eprinttype = {arXiv},
  eprint     = {2005.04364},
  timestamp  = {Fri, 17 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-04364.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.04966.
@article{DBLP:journals/corr/abs-2005-04966,
  author     = {Li, Junnan and
                Zhou, Pan and
                Xiong, Caiming and
                Socher, Richard and
                Hoi, Steven C. H.},
  title      = {Prototypical Contrastive Learning of Unsupervised Representations},
  journal    = {CoRR},
  volume     = {abs/2005.04966},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.04966},
  eprinttype = {arXiv},
  eprint     = {2005.04966},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-04966.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.12484.
@article{DBLP:journals/corr/abs-2005-12484,
  author     = {Gao, Yifan and
                Wu, Chien{-}Sheng and
                Joty, Shafiq R. and
                Xiong, Caiming and
                Socher, Richard and
                King, Irwin and
                Lyu, Michael R. and
                Hoi, Steven C. H.},
  title      = {{EMT:} Explicit Memory Tracker with Coarse-to-Fine Reasoning for Conversational Machine Reading},
  journal    = {CoRR},
  volume     = {abs/2005.12484},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.12484},
  eprinttype = {arXiv},
  eprint     = {2005.12484},
  timestamp  = {Fri, 17 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-12484.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.03732.
@article{DBLP:journals/corr/abs-2006-03732,
  author     = {Gao, Mingfei and
                Zhou, Yingbo and
                Xu, Ran and
                Socher, Richard and
                Xiong, Caiming},
  title      = {{WOAD:} Weakly Supervised Online Action Detection in Untrimmed Videos},
  journal    = {CoRR},
  volume     = {abs/2006.03732},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.03732},
  eprinttype = {arXiv},
  eprint     = {2006.03732},
  timestamp  = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-03732.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.09595. CO-Search is brace-protected in the title, like
% COVID-19, so that sentence-casing bibliography styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2006-09595,
  author       = {Andre Esteva and
                  Anuprit Kale and
                  Romain Paulus and
                  Kazuma Hashimoto and
                  Wenpeng Yin and
                  Dragomir R. Radev and
                  Richard Socher},
  title        = {{CO-Search}: {COVID-19} Information Retrieval with Semantic Search,
                  Question Answering, and Abstractive Summarization},
  journal      = {CoRR},
  volume       = {abs/2006.09595},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.09595},
  eprinttype   = {arXiv},
  eprint       = {2006.09595},
  timestamp    = {Wed, 28 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-09595.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.13425.
@article{DBLP:journals/corr/abs-2006-13425,
  author     = {Hashimoto, Kazuma and
                Buschiazzo, Raffaella and
                Bradbury, James and
                Marshall, Teresa and
                Socher, Richard and
                Xiong, Caiming},
  title      = {A High-Quality Multilingual Dataset for Structured Documentation Translation},
  journal    = {CoRR},
  volume     = {abs/2006.13425},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.13425},
  eprinttype = {arXiv},
  eprint     = {2006.13425},
  timestamp  = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-13425.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.13436; same title and authors as DBLP:conf/nips/ChenBLZWXS20.
@article{DBLP:journals/corr/abs-2006-13436,
  author     = {Chen, Minshuo and
                Bai, Yu and
                Lee, Jason D. and
                Zhao, Tuo and
                Wang, Huan and
                Xiong, Caiming and
                Socher, Richard},
  title      = {Towards Understanding Hierarchical Learning: Benefits of Neural Representations},
  journal    = {CoRR},
  volume     = {abs/2006.13436},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.13436},
  eprinttype = {arXiv},
  eprint     = {2006.13436},
  timestamp  = {Sat, 15 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-13436.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.15222. BERTology is brace-protected in the title so that
% sentence-casing bibliography styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2006-15222,
  author       = {Jesse Vig and
                  Ali Madani and
                  Lav R. Varshney and
                  Caiming Xiong and
                  Richard Socher and
                  Nazneen Fatema Rajani},
  title        = {{BERTology} Meets Biology: Interpreting Attention in Protein Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2006.15222},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.15222},
  eprinttype   = {arXiv},
  eprint       = {2006.15222},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-15222.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-16537,
  author       = {Pan Zhou and
                  Caiming Xiong and
                  Richard Socher and
                  Steven C. H. Hoi},
  title        = {Theory-Inspired Path-Regularized Differential Network
                  Architecture Search},
  journal      = {CoRR},
  volume       = {abs/2006.16537},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.16537},
  eprinttype   = {arXiv},
  eprint       = {2006.16537},
  timestamp    = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-16537.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The colon stays outside the {DART} braces so BibTeX sees it and keeps the
% capital of the first subtitle word under sentence-casing styles.
@article{DBLP:journals/corr/abs-2007-02871,
  author       = {Dragomir R. Radev and
                  Rui Zhang and
                  Amrit Rau and
                  Abhinand Sivaprasad and
                  Chiachun Hsieh and
                  Nazneen Fatema Rajani and
                  Xiangru Tang and
                  Aadit Vyas and
                  Neha Verma and
                  Pranav Krishna and
                  Yangxiaokang Liu and
                  Nadia Irwanto and
                  Jessica Pan and
                  Faiaz Rahman and
                  Ahmad Zaidi and
                  Murori Mutuma and
                  Yasin Tarabar and
                  Ankit Gupta and
                  Tao Yu and
                  Yi Chern Tan and
                  Xi Victoria Lin and
                  Caiming Xiong and
                  Richard Socher},
  title        = {{DART}: Open-Domain Structured Data Record to Text Generation},
  journal      = {CoRR},
  volume       = {abs/2007.02871},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.02871},
  eprinttype   = {arXiv},
  eprint       = {2007.02871},
  timestamp    = {Fri, 06 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-02871.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {SummEval} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2007-12626,
  author       = {Alexander R. Fabbri and
                  Wojciech Kryscinski and
                  Bryan McCann and
                  Caiming Xiong and
                  Richard Socher and
                  Dragomir R. Radev},
  title        = {{SummEval}: Re-evaluating Summarization Evaluation},
  journal      = {CoRR},
  volume       = {abs/2007.12626},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.12626},
  eprinttype   = {arXiv},
  eprint       = {2007.12626},
  timestamp    = {Wed, 29 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-12626.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {SQL} is braced so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-2007-15280,
  author       = {Jichuan Zeng and
                  Xi Victoria Lin and
                  Caiming Xiong and
                  Richard Socher and
                  Michael R. Lyu and
                  Irwin King and
                  Steven C. H. Hoi},
  title        = {Photon: {A} Robust Cross-Domain Text-to-{SQL} System},
  journal      = {CoRR},
  volume       = {abs/2007.15280},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.15280},
  eprinttype   = {arXiv},
  eprint       = {2007.15280},
  timestamp    = {Mon, 03 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-15280.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {Yup'ik} is a language name; braced so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2009-04087,
  author       = {Christopher Liu and
                  Laura Domin{\'{e}} and
                  Kevin Chavez and
                  Richard Socher},
  title        = {Central {Yup'ik} and Machine Translation of Low-Resource Polysynthetic
                  Languages},
  journal      = {CoRR},
  volume       = {abs/2009.04087},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.04087},
  eprinttype   = {arXiv},
  eprint       = {2009.04087},
  timestamp    = {Thu, 17 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-04087.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {GeDi} is braced so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2009-06367,
  author       = {Ben Krause and
                  Akhilesh Deepak Gotmare and
                  Bryan McCann and
                  Nitish Shirish Keskar and
                  Shafiq R. Joty and
                  Richard Socher and
                  Nazneen Fatema Rajani},
  title        = {{GeDi}: Generative Discriminator Guided Sequence Generation},
  journal      = {CoRR},
  volume       = {abs/2009.06367},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.06367},
  eprinttype   = {arXiv},
  eprint       = {2009.06367},
  timestamp    = {Fri, 18 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-06367.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-10056,
  author       = {Congying Xia and
                  Caiming Xiong and
                  Philip S. Yu and
                  Richard Socher},
  title        = {Composed Variational Natural Language Generation for Few-shot
                  Intents},
  journal      = {CoRR},
  volume       = {abs/2009.10056},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.10056},
  eprinttype   = {arXiv},
  eprint       = {2009.10056},
  timestamp    = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-10056.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {GraPPa} is braced so sentence-casing styles keep its inner capitals.
@article{DBLP:journals/corr/abs-2009-13845,
  author       = {Tao Yu and
                  Chien{-}Sheng Wu and
                  Xi Victoria Lin and
                  Bailin Wang and
                  Yi Chern Tan and
                  Xinyi Yang and
                  Dragomir R. Radev and
                  Richard Socher and
                  Caiming Xiong},
  title        = {{GraPPa}: Grammar-Augmented Pre-Training for Table Semantic Parsing},
  journal      = {CoRR},
  volume       = {abs/2009.13845},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.13845},
  eprinttype   = {arXiv},
  eprint       = {2009.13845},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-13845.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-02584,
  author       = {Wenpeng Yin and
                  Nazneen Fatema Rajani and
                  Dragomir R. Radev and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Universal Natural Language Processing with Limited Annotations:
                  Try Few-shot Textual Entailment as a Start},
  journal      = {CoRR},
  volume       = {abs/2010.02584},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.02584},
  eprinttype   = {arXiv},
  eprint       = {2010.02584},
  timestamp    = {Wed, 28 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-02584.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-07126,
  author       = {Lav R. Varshney and
                  Nazneen Fatema Rajani and
                  Richard Socher},
  title        = {Explaining Creative Artifacts},
  journal      = {CoRR},
  volume       = {abs/2010.07126},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.07126},
  eprinttype   = {arXiv},
  eprint       = {2010.07126},
  timestamp    = {Tue, 20 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-07126.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Wengpeng Yin" normalized to "Wenpeng Yin", the spelling used by entry
% abs-2010-02584 (overlapping co-authors) - presumably the same person; confirm.
@article{DBLP:journals/corr/abs-2010-09030,
  author       = {Nazneen Fatema Rajani and
                  Ben Krause and
                  Wenpeng Yin and
                  Tong Niu and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Explaining and Improving Model Behavior with k Nearest Neighbor
                  Representations},
  journal      = {CoRR},
  volume       = {abs/2010.09030},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.09030},
  eprinttype   = {arXiv},
  eprint       = {2010.09030},
  timestamp    = {Wed, 21 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-09030.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-11545,
  author       = {Huaxiu Yao and
                  Yingbo Zhou and
                  Mehrdad Mahdavi and
                  Zhenhui Li and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Online Structured Meta-learning},
  journal      = {CoRR},
  volume       = {abs/2010.11545},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.11545},
  eprinttype   = {arXiv},
  eprint       = {2010.11545},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-11545.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-13009,
  author       = {Jian{-}Guo Zhang and
                  Kazuma Hashimoto and
                  Wenhao Liu and
                  Chien{-}Sheng Wu and
                  Yao Wan and
                  Philip S. Yu and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Discriminative Nearest Neighbor Few-Shot Intent Detection
                  by Transferring Natural Language Inference},
  journal      = {CoRR},
  volume       = {abs/2010.13009},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.13009},
  eprinttype   = {arXiv},
  eprint       = {2010.13009},
  timestamp    = {Tue, 13 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-13009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {SQL} is braced so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-2012-12627,
  author       = {Xi Victoria Lin and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Bridging Textual and Tabular Data for Cross-Domain Text-to-{SQL} Semantic
                  Parsing},
  journal      = {CoRR},
  volume       = {abs/2012.12627},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.12627},
  eprinttype   = {arXiv},
  eprint       = {2012.12627},
  timestamp    = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-12627.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {Fisher} is a proper noun; braced so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2012-14193,
  author       = {Stanislaw Jastrzebski and
                  Devansh Arpit and
                  Oliver {\AA}strand and
                  Giancarlo Kerg and
                  Huan Wang and
                  Caiming Xiong and
                  Richard Socher and
                  Kyunghyun Cho and
                  Krzysztof J. Geras},
  title        = {Catastrophic {Fisher} Explosion: Early Phase {Fisher} Matrix Impacts
                  Generalization},
  journal      = {CoRR},
  volume       = {abs/2012.14193},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.14193},
  eprinttype   = {arXiv},
  eprint       = {2012.14193},
  timestamp    = {Fri, 26 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-14193.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Date range in booktitle respaced: "July 28 - August 2" (was "July 28- August 2").
@inproceedings{DBLP:conf/acl/WuMHXSF19,
  author       = {Chien{-}Sheng Wu and
                  Andrea Madotto and
                  Ehsan Hosseini{-}Asl and
                  Caiming Xiong and
                  Richard Socher and
                  Pascale Fung},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {Transferable Multi-Domain State Generator for Task-Oriented Dialogue
                  Systems},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {808--819},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1078},
  doi          = {10.18653/V1/P19-1078},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WuMHXSF19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {SParC} is braced so sentence-casing styles keep its inner capitals.
% Date range in booktitle respaced: "July 28 - August 2".
@inproceedings{DBLP:conf/acl/YuZYTLLELPCJDPS19,
  author       = {Tao Yu and
                  Rui Zhang and
                  Michihiro Yasunaga and
                  Yi Chern Tan and
                  Xi Victoria Lin and
                  Suyi Li and
                  Heyang Er and
                  Irene Li and
                  Bo Pang and
                  Tao Chen and
                  Emily Ji and
                  Shreya Dixit and
                  David Proctor and
                  Sungrok Shim and
                  Jonathan Kraft and
                  Vincent Zhang and
                  Caiming Xiong and
                  Richard Socher and
                  Dragomir R. Radev},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {{SParC}: Cross-Domain Semantic Parsing in Context},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {4511--4523},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1443},
  doi          = {10.18653/V1/P19-1443},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YuZYTLLELPCJDPS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {Leveraging} starts a new sentence after "!"; braced so sentence-casing
% styles do not lowercase it. Date range in booktitle respaced.
@inproceedings{DBLP:conf/acl/RajaniMXS19,
  author       = {Nazneen Fatema Rajani and
                  Bryan McCann and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {Explain Yourself! {Leveraging} Language Models for Commonsense Reasoning},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {4932--4942},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1487},
  doi          = {10.18653/V1/P19-1487},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RajaniMXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Acronyms in booktitle are braced, as in the other proceedings entries of this file.
@inproceedings{DBLP:conf/acl-deeplo/SinghMSX19,
  author       = {Jasdeep Singh and
                  Bryan McCann and
                  Richard Socher and
                  Caiming Xiong},
  editor       = {Colin Cherry and
                  Greg Durrett and
                  George F. Foster and
                  Reza Haffari and
                  Shahram Khadivi and
                  Nanyun Peng and
                  Xiang Ren and
                  Swabha Swayamdipta},
  title        = {{BERT} is Not an Interlingua and the Bias of Tokenization},
  booktitle    = {Proceedings of the 2nd Workshop on Deep Learning Approaches for Low-Resource
                  {NLP}, {DeepLo@EMNLP-IJCNLP} 2019, Hong Kong, China, November 3, 2019},
  pages        = {47--55},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-6106},
  doi          = {10.18653/V1/D19-6106},
  timestamp    = {Thu, 05 Aug 2021 17:36:17 +0200},
  biburl       = {https://dblp.org/rec/conf/acl-deeplo/SinghMSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {AdaFrame} is braced so sentence-casing styles keep its inner capital.
% URL scheme switched to https; path unchanged.
@inproceedings{DBLP:conf/cvpr/WuXMSD19,
  author       = {Zuxuan Wu and
                  Caiming Xiong and
                  Chih{-}Yao Ma and
                  Richard Socher and
                  Larry S. Davis},
  title        = {{AdaFrame}: Adaptive Frame Selection for Fast Video Recognition},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {1278--1287},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2019/html/Wu\_AdaFrame\_Adaptive\_Frame\_Selection\_for\_Fast\_Video\_Recognition\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.00137},
  timestamp    = {Mon, 30 Aug 2021 17:01:14 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/WuXMSD19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/KryscinskiKMXS19,
  author       = {Wojciech Kryscinski and
                  Nitish Shirish Keskar and
                  Bryan McCann and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {Kentaro Inui and
                  Jing Jiang and
                  Vincent Ng and
                  Xiaojun Wan},
  title        = {Neural Text Summarization: {A} Critical Evaluation},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods
                  in Natural Language Processing and the 9th International
                  Joint Conference on Natural Language Processing,
                  {EMNLP-IJCNLP} 2019, Hong Kong, China, November 3-7, 2019},
  pages        = {540--551},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1051},
  doi          = {10.18653/V1/D19-1051},
  timestamp    = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/KryscinskiKMXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The colon stays outside the {WSLLN} braces so BibTeX sees it and keeps the
% capital of the first subtitle word under sentence-casing styles.
% "Larry Davis" normalized to "Larry S. Davis" as in entry conf/cvpr/WuXMSD19 -
% presumably the same author; confirm.
@inproceedings{DBLP:conf/emnlp/GaoDSX19,
  author       = {Mingfei Gao and
                  Larry S. Davis and
                  Richard Socher and
                  Caiming Xiong},
  editor       = {Kentaro Inui and
                  Jing Jiang and
                  Vincent Ng and
                  Xiaojun Wan},
  title        = {{WSLLN}: Weakly Supervised Natural Language Localization Networks},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {1481--1487},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1157},
  doi          = {10.18653/V1/D19-1157},
  timestamp    = {Thu, 12 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/GaoDSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {CoSQL} and {SQL} are braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/emnlp/YuZELXPLTSLJYSC19,
  author       = {Tao Yu and
                  Rui Zhang and
                  Heyang Er and
                  Suyi Li and
                  Eric Xue and
                  Bo Pang and
                  Xi Victoria Lin and
                  Yi Chern Tan and
                  Tianze Shi and
                  Zihan Li and
                  Youxuan Jiang and
                  Michihiro Yasunaga and
                  Sungrok Shim and
                  Tao Chen and
                  Alexander R. Fabbri and
                  Zifan Li and
                  Luyao Chen and
                  Yuwen Zhang and
                  Shreya Dixit and
                  Vincent Zhang and
                  Caiming Xiong and
                  Richard Socher and
                  Walter S. Lasecki and
                  Dragomir R. Radev},
  editor       = {Kentaro Inui and
                  Jing Jiang and
                  Vincent Ng and
                  Xiaojun Wan},
  title        = {{CoSQL}: {A} Conversational Text-to-{SQL} Challenge Towards Cross-Domain
                  Natural Language Interfaces to Databases},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {1962--1979},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1204},
  doi          = {10.18653/V1/D19-1204},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/YuZELXPLTSLJYSC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhangYESXLSXSR19,
  author       = {Rui Zhang and
                  Tao Yu and
                  Heyang Er and
                  Sungrok Shim and
                  Eric Xue and
                  Xi Victoria Lin and
                  Tianze Shi and
                  Caiming Xiong and
                  Richard Socher and
                  Dragomir R. Radev},
  editor       = {Kentaro Inui and
                  Jing Jiang and
                  Vincent Ng and
                  Xiaojun Wan},
  title        = {Editing-Based {SQL} Query Generation for Cross-Domain
                  Context-Dependent Questions},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods
                  in Natural Language Processing and the 9th International
                  Joint Conference on Natural Language Processing,
                  {EMNLP-IJCNLP} 2019, Hong Kong, China, November 3-7, 2019},
  pages        = {5337--5348},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1537},
  doi          = {10.18653/V1/D19-1537},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhangYESXLSXSR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {StartNet} is braced so sentence-casing styles keep its inner capital.
% "Larry Davis" normalized to "Larry S. Davis" as in entry conf/cvpr/WuXMSD19 -
% presumably the same author; confirm.
@inproceedings{DBLP:conf/iccv/GaoX0SX19,
  author       = {Mingfei Gao and
                  Mingze Xu and
                  Larry S. Davis and
                  Richard Socher and
                  Caiming Xiong},
  title        = {{StartNet}: Online Detection of Action Start in Untrimmed Videos},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages        = {5541--5550},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCV.2019.00564},
  doi          = {10.1109/ICCV.2019.00564},
  timestamp    = {Thu, 05 Mar 2020 10:01:04 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/GaoX0SX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title stored in Title Case like the other entries; styles can still downcase it.
% "Akhilesh Gotmare" normalized to "Akhilesh Deepak Gotmare" as in entry
% abs-2009-06367 - presumably the same author; confirm.
@inproceedings{DBLP:conf/iclr/GotmareKXS19,
  author       = {Akhilesh Deepak Gotmare and
                  Nitish Shirish Keskar and
                  Caiming Xiong and
                  Richard Socher},
  title        = {A Closer Look at Deep Learning Heuristics: Learning Rate Restarts,
                  Warmup and Distillation},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=r14EOsCqKX},
  timestamp    = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GotmareKXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Hosseini-AslZXS19,
  author       = {Ehsan Hosseini{-}Asl and
                  Yingbo Zhou and
                  Caiming Xiong and
                  Richard Socher},
  title        = {Augmented Cyclic Adversarial Learning for Low Resource Domain
                  Adaptation},
  booktitle    = {7th International Conference on Learning Representations,
                  {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=B1G9doA9F7},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Hosseini-AslZXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title stored in Title Case like the other entries; styles can still downcase it.
@inproceedings{DBLP:conf/iclr/LiuTSX19,
  author       = {Hao Liu and
                  Alexander Trott and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Competitive Experience Replay},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=Sklsm20ctX},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LiuTSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MaLWAKSX19,
  author       = {Chih{-}Yao Ma and
                  Jiasen Lu and
                  Zuxuan Wu and
                  Ghassan AlRegib and
                  Zsolt Kira and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Self-Monitoring Navigation Agent via Auxiliary Progress
                  Estimation},
  booktitle    = {7th International Conference on Learning Representations,
                  {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=r1GAsjC5Fm},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MaLWAKSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/WuSX19,
  author       = {Chien{-}Sheng Wu and
                  Richard Socher and
                  Caiming Xiong},
  title        = {Global-to-local Memory Pointer Networks for Task-Oriented
                  Dialogue},
  booktitle    = {7th International Conference on Learning Representations,
                  {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=ryxnHhRqFm},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WuSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhongXKS19,
  author       = {Victor Zhong and
                  Caiming Xiong and
                  Nitish Shirish Keskar and
                  Richard Socher},
  title        = {Coarse-grain Fine-grain Coattention Network for Multi-evidence
                  Question Answering},
  booktitle    = {7th International Conference on Learning Representations,
                  {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=Syl7OsRqY7},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhongXKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% URL scheme switched to https; path unchanged.
@inproceedings{DBLP:conf/icml/LiZWSX19,
  author       = {Xilai Li and
                  Yingbo Zhou and
                  Tianfu Wu and
                  Richard Socher and
                  Caiming Xiong},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {Learn to Grow: {A} Continual Structure Learning Framework for Overcoming
                  Catastrophic Forgetting},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {3925--3934},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/li19m.html},
  timestamp    = {Wed, 13 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LiZWSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The colon stays outside the {MAML} braces so BibTeX sees it and keeps the
% capital of the first subtitle word under sentence-casing styles.
% Subtitle stored in Title Case like the other entries; URL scheme switched to https.
@inproceedings{DBLP:conf/icml/LiuSX19,
  author       = {Hao Liu and
                  Richard Socher and
                  Caiming Xiong},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {Taming {MAML}: Efficient Unbiased Meta-Reinforcement Learning},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {4061--4071},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/liu19g.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LiuSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% URL scheme switched to https; path unchanged.
@inproceedings{DBLP:conf/icml/WangZXS19,
  author       = {Huan Wang and
                  Stephan Zheng and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {On the Generalization Gap in Reparameterizable Reinforcement Learning},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {6648--6658},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/wang19o.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/WangZXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% {NeurIPS} in booktitle is braced, as the other proceedings entries brace
% their venue acronyms.
@inproceedings{DBLP:conf/nips/TrottZXS19,
  author       = {Alexander Trott and
                  Stephan Zheng and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {Keeping Your Distance: Solving Sparse Reward Tasks Using Self-Balancing
                  Shaped Rewards},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {10376--10386},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/64c26b2a2dcf068c49894bd07e0e6389-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/TrottZXS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% PLDI 2019 paper. The title is stored in Title Case (with {A} protected after
% the colon) so that any style can downcase it; a lowercase-only title cannot be
% re-capitalised by a style. Same casing as the CoRR record of this paper,
% DBLP:journals/corr/abs-1904-09020.
@inproceedings{DBLP:conf/pldi/CampagnaXMSL19,
  author       = {Campagna, Giovanni and
                  Xu, Silei and
                  Moradshahi, Mehrad and
                  Socher, Richard and
                  Lam, Monica S.},
  editor       = {McKinley, Kathryn S. and
                  Fisher, Kathleen},
  title        = {Genie: {A} Generator of Natural Language Semantic Parsers for Virtual
                  Assistant Commands},
  booktitle    = {Proceedings of the 40th {ACM} {SIGPLAN} Conference on Programming
                  Language Design and Implementation, {PLDI} 2019, Phoenix, AZ, USA,
                  June 22-26, 2019},
  pages        = {394--410},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3314221.3314594},
  doi          = {10.1145/3314221.3314594},
  timestamp    = {Sun, 09 Jun 2019 18:52:19 +0200},
  biburl       = {https://dblp.org/rec/conf/pldi/CampagnaXMSL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% WMT 2019 (Volume 1: Research Papers) paper; names are given in the
% unambiguous "Last, First" form.
@inproceedings{DBLP:conf/wmt/HashimotoBBMSX19,
  author       = {Hashimoto, Kazuma and
                  Buschiazzo, Raffaella and
                  Bradbury, James and
                  Marshall, Teresa and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Bojar, Ondrej and
                  Chatterjee, Rajen and
                  Federmann, Christian and
                  Fishel, Mark and
                  Graham, Yvette and
                  Haddow, Barry and
                  Huck, Matthias and
                  Jimeno{-}Yepes, Antonio and
                  Koehn, Philipp and
                  Martins, Andr{\'{e}} and
                  Monz, Christof and
                  Negri, Matteo and
                  N{\'{e}}v{\'{e}}ol, Aur{\'{e}}lie and
                  Neves, Mariana L. and
                  Post, Matt and
                  Turchi, Marco and
                  Verspoor, Karin},
  title        = {A High-Quality Multilingual Dataset for Structured Documentation Translation},
  booktitle    = {Proceedings of the Fourth Conference on Machine Translation, {WMT}
                  2019, Florence, Italy, August 1-2, 2019 - Volume 1: Research Papers},
  pages        = {116--127},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/w19-5212},
  doi          = {10.18653/V1/W19-5212},
  timestamp    = {Thu, 17 Feb 2022 16:43:16 +0100},
  biburl       = {https://dblp.org/rec/conf/wmt/HashimotoBBMSX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.00603, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1901-00603,
  author       = {Zhong, Victor and
                  Xiong, Caiming and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {Coarse-grain Fine-grain Coattention Network for Multi-evidence Question
                  Answering},
  journal      = {CoRR},
  volume       = {abs/1901.00603},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.00603},
  eprinttype   = {arXiv},
  eprint       = {1901.00603},
  timestamp    = {Thu, 31 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-00603.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.03035, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1901-03035,
  author       = {Ma, Chih{-}Yao and
                  Lu, Jiasen and
                  Wu, Zuxuan and
                  AlRegib, Ghassan and
                  Kira, Zsolt and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Self-Monitoring Navigation Agent via Auxiliary Progress Estimation},
  journal      = {CoRR},
  volume       = {abs/1901.03035},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.03035},
  eprinttype   = {arXiv},
  eprint       = {1901.03035},
  timestamp    = {Fri, 01 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-03035.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.04713, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1901-04713,
  author       = {Wu, Chien{-}Sheng and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Global-to-local Memory Pointer Networks for Task-Oriented Dialogue},
  journal      = {CoRR},
  volume       = {abs/1901.04713},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.04713},
  eprinttype   = {arXiv},
  eprint       = {1901.04713},
  timestamp    = {Fri, 01 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-04713.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1902.00528, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1902-00528,
  author       = {Liu, Hao and
                  Trott, Alexander and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Competitive Experience Replay},
  journal      = {CoRR},
  volume       = {abs/1902.00528},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.00528},
  eprinttype   = {arXiv},
  eprint       = {1902.00528},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-00528.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1903.09868, recorded by DBLP under the CoRR journal.
% {StartNet} is brace-protected: styles that sentence-case titles would
% otherwise lowercase its inner capital ("Startnet").
@article{DBLP:journals/corr/abs-1903-09868,
  author       = {Gao, Mingfei and
                  Xu, Mingze and
                  Davis, Larry S. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {{StartNet}: Online Detection of Action Start in Untrimmed Videos},
  journal      = {CoRR},
  volume       = {abs/1903.09868},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.09868},
  eprinttype   = {arXiv},
  eprint       = {1903.09868},
  timestamp    = {Mon, 01 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-09868.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1904.00310, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1904-00310,
  author       = {Li, Xilai and
                  Zhou, Yingbo and
                  Wu, Tianfu and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Learn to Grow: {A} Continual Structure Learning Framework for Overcoming
                  Catastrophic Forgetting},
  journal      = {CoRR},
  volume       = {abs/1904.00310},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.00310},
  eprinttype   = {arXiv},
  eprint       = {1904.00310},
  timestamp    = {Wed, 13 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-00310.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1904.09020 (CoRR). The same authors and title also appear in
% this file as the PLDI 2019 record DBLP:conf/pldi/CampagnaXMSL19.
@article{DBLP:journals/corr/abs-1904-09020,
  author       = {Campagna, Giovanni and
                  Xu, Silei and
                  Moradshahi, Mehrad and
                  Socher, Richard and
                  Lam, Monica S.},
  title        = {Genie: {A} Generator of Natural Language Semantic Parsers for Virtual
                  Assistant Commands},
  journal      = {CoRR},
  volume       = {abs/1904.09020},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.09020},
  eprinttype   = {arXiv},
  eprint       = {1904.09020},
  timestamp    = {Fri, 26 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-09020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1904.09286, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1904-09286,
  author       = {Keskar, Nitish Shirish and
                  McCann, Bryan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Unifying Question Answering and Text Classification via Span Extraction},
  journal      = {CoRR},
  volume       = {abs/1904.09286},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.09286},
  eprinttype   = {arXiv},
  eprint       = {1904.09286},
  timestamp    = {Fri, 26 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-09286.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1905.08743, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1905-08743,
  author       = {Wu, Chien{-}Sheng and
                  Madotto, Andrea and
                  Hosseini{-}Asl, Ehsan and
                  Xiong, Caiming and
                  Socher, Richard and
                  Fung, Pascale},
  title        = {Transferable Multi-Domain State Generator for Task-Oriented Dialogue
                  Systems},
  journal      = {CoRR},
  volume       = {abs/1905.08743},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.08743},
  eprinttype   = {arXiv},
  eprint       = {1905.08743},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-08743.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1905.11471, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1905-11471,
  author       = {Singh, Jasdeep and
                  McCann, Bryan and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {{XLDA:} Cross-Lingual Data Augmentation for Natural Language Inference
                  and Question Answering},
  journal      = {CoRR},
  volume       = {abs/1905.11471},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.11471},
  eprinttype   = {arXiv},
  eprint       = {1905.11471},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-11471.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1905.12654 (CoRR). It shares its title with the ICML 2019
% record in this file (biburl .../conf/icml/WangZXS19.bib).
@article{DBLP:journals/corr/abs-1905-12654,
  author       = {Wang, Huan and
                  Zheng, Stephan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {On the Generalization Gap in Reparameterizable Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1905.12654},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.12654},
  eprinttype   = {arXiv},
  eprint       = {1905.12654},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-12654.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1906.02285, recorded by DBLP under the CoRR journal.
% {SParC} is brace-protected: styles that sentence-case titles keep only the
% first letter's case and would otherwise print "Sparc".
@article{DBLP:journals/corr/abs-1906-02285,
  author       = {Yu, Tao and
                  Zhang, Rui and
                  Yasunaga, Michihiro and
                  Tan, Yi Chern and
                  Lin, Xi Victoria and
                  Li, Suyi and
                  Er, Heyang and
                  Li, Irene and
                  Pang, Bo and
                  Chen, Tao and
                  Ji, Emily and
                  Dixit, Shreya and
                  Proctor, David and
                  Shim, Sungrok and
                  Kraft, Jonathan and
                  Zhang, Vincent and
                  Xiong, Caiming and
                  Socher, Richard and
                  Radev, Dragomir R.},
  title        = {{SParC}: Cross-Domain Semantic Parsing in Context},
  journal      = {CoRR},
  volume       = {abs/1906.02285},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.02285},
  eprinttype   = {arXiv},
  eprint       = {1906.02285},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-02285.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1906.02361, recorded by DBLP under the CoRR journal.
% {Leveraging} is brace-protected because it starts a new sentence after "!";
% sentence-casing styles only preserve capitals after a colon and would
% otherwise lowercase it.
@article{DBLP:journals/corr/abs-1906-02361,
  author       = {Rajani, Nazneen Fatema and
                  McCann, Bryan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Explain Yourself! {Leveraging} Language Models for Commonsense Reasoning},
  journal      = {CoRR},
  volume       = {abs/1906.02361},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.02361},
  eprinttype   = {arXiv},
  eprint       = {1906.02361},
  timestamp    = {Thu, 13 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-02361.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1907.00664, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1907-00664,
  author       = {Shang, Wenling and
                  Trott, Alexander and
                  Zheng, Stephan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Learning World Graphs to Accelerate Hierarchical Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1907.00664},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.00664},
  eprinttype   = {arXiv},
  eprint       = {1907.00664},
  timestamp    = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-00664.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1908.08960, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1908-08960,
  author       = {Kryscinski, Wojciech and
                  Keskar, Nitish Shirish and
                  McCann, Bryan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Neural Text Summarization: {A} Critical Evaluation},
  journal      = {CoRR},
  volume       = {abs/1908.08960},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.08960},
  eprinttype   = {arXiv},
  eprint       = {1908.08960},
  timestamp    = {Thu, 29 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-08960.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.00239, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1909-00239,
  author       = {Gao, Mingfei and
                  Davis, Larry S. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {{WSLLN:} Weakly Supervised Natural Language Localization Networks},
  journal      = {CoRR},
  volume       = {abs/1909.00239},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.00239},
  eprinttype   = {arXiv},
  eprint       = {1909.00239},
  timestamp    = {Mon, 16 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-00239.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.00786, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1909-00786,
  author       = {Zhang, Rui and
                  Yu, Tao and
                  Er, Heyang and
                  Shim, Sungrok and
                  Xue, Eric and
                  Lin, Xi Victoria and
                  Shi, Tianze and
                  Xiong, Caiming and
                  Socher, Richard and
                  Radev, Dragomir R.},
  title        = {Editing-Based {SQL} Query Generation for Cross-Domain Context-Dependent
                  Questions},
  journal      = {CoRR},
  volume       = {abs/1909.00786},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.00786},
  eprinttype   = {arXiv},
  eprint       = {1909.00786},
  timestamp    = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-00786.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.03223, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1909-03223,
  author       = {Niu, Tong and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Deleter: Leveraging {BERT} to Perform Unsupervised Successive Text
                  Compression},
  journal      = {CoRR},
  volume       = {abs/1909.03223},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.03223},
  eprinttype   = {arXiv},
  eprint       = {1909.03223},
  timestamp    = {Tue, 17 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-03223.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.03290, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1909-03290,
  author       = {Varshney, Lav R. and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {Pretrained {AI} Models: Performativity, Mobility, and Change},
  journal      = {CoRR},
  volume       = {abs/1909.03290},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.03290},
  eprinttype   = {arXiv},
  eprint       = {1909.03290},
  timestamp    = {Tue, 17 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-03290.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.05378, recorded by DBLP under the CoRR journal.
% {CoSQL} and the {SQL} in "Text-to-SQL" are brace-protected: styles that
% sentence-case titles would otherwise print "Cosql" and "text-to-sql".
@article{DBLP:journals/corr/abs-1909-05378,
  author       = {Yu, Tao and
                  Zhang, Rui and
                  Er, Heyang and
                  Li, Suyi and
                  Xue, Eric and
                  Pang, Bo and
                  Lin, Xi Victoria and
                  Tan, Yi Chern and
                  Shi, Tianze and
                  Li, Zihan and
                  Jiang, Youxuan and
                  Yasunaga, Michihiro and
                  Shim, Sungrok and
                  Chen, Tao and
                  Fabbri, Alexander R. and
                  Li, Zifan and
                  Chen, Luyao and
                  Zhang, Yuwen and
                  Dixit, Shreya and
                  Zhang, Vincent and
                  Xiong, Caiming and
                  Socher, Richard and
                  Lasecki, Walter S. and
                  Radev, Dragomir R.},
  title        = {{CoSQL}: {A} Conversational Text-to-{SQL} Challenge Towards Cross-Domain
                  Natural Language Interfaces to Databases},
  journal      = {CoRR},
  volume       = {abs/1909.05378},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.05378},
  eprinttype   = {arXiv},
  eprint       = {1909.05378},
  timestamp    = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-05378.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1909.05858, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1909-05858,
  author       = {Keskar, Nitish Shirish and
                  McCann, Bryan and
                  Varshney, Lav R. and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {{CTRL:} {A} Conditional Transformer Language Model for Controllable
                  Generation},
  journal      = {CoRR},
  volume       = {abs/1909.05858},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.05858},
  eprinttype   = {arXiv},
  eprint       = {1909.05858},
  timestamp    = {Wed, 18 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-05858.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1910.00164, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1910-00164,
  author       = {Arpit, Devansh and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Entropy Penalty: Towards Generalization Beyond the {IID} Assumption},
  journal      = {CoRR},
  volume       = {abs/1910.00164},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.00164},
  eprinttype   = {arXiv},
  eprint       = {1910.00164},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-00164.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1910.03544, recorded by DBLP under the CoRR journal.
% {Dual} is brace-protected because it starts a new sentence after "?";
% sentence-casing styles only preserve capitals after a colon and would
% otherwise lowercase it.
@article{DBLP:journals/corr/abs-1910-03544,
  author       = {Zhang, Jianguo and
                  Hashimoto, Kazuma and
                  Wu, Chien{-}Sheng and
                  Wan, Yao and
                  Yu, Philip S. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Find or Classify? {Dual} Strategy for Slot-Value Predictions on Multi-Domain
                  Dialog State Tracking},
  journal      = {CoRR},
  volume       = {abs/1910.03544},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.03544},
  eprinttype   = {arXiv},
  eprint       = {1910.03544},
  timestamp    = {Tue, 13 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-03544.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1910.10245, recorded by DBLP under the CoRR journal.
% {ReLU} is brace-protected: styles that sentence-case titles would otherwise
% print it as "relu".
@article{DBLP:journals/corr/abs-1910-10245,
  author       = {Theisen, Ryan and
                  Klusowski, Jason M. and
                  Wang, Huan and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Global Capacity Measures for Deep {ReLU} Networks via Path Sampling},
  journal      = {CoRR},
  volume       = {abs/1910.10245},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.10245},
  eprinttype   = {arXiv},
  eprint       = {1910.10245},
  timestamp    = {Fri, 25 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-10245.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1910.12840, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1910-12840,
  author       = {Kryscinski, Wojciech and
                  McCann, Bryan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Evaluating the Factual Consistency of Abstractive Text Summarization},
  journal      = {CoRR},
  volume       = {abs/1910.12840},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.12840},
  eprinttype   = {arXiv},
  eprint       = {1910.12840},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-12840.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1910.13008, recorded by DBLP under the CoRR journal.
% {Sketch-Fill-A-R} is brace-protected: styles that sentence-case titles would
% otherwise print it as "Sketch-fill-a-r".
@article{DBLP:journals/corr/abs-1910-13008,
  author       = {Shum, Michael and
                  Zheng, Stephan and
                  Kryscinski, Wojciech and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {{Sketch-Fill-A-R}: {A} Persona-Grounded Chit-Chat Generation Framework},
  journal      = {CoRR},
  volume       = {abs/1910.13008},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.13008},
  eprinttype   = {arXiv},
  eprint       = {1910.13008},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-13008.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1911.01417 (CoRR). The same authors and title also appear in
% this file as the NeurIPS 2019 record DBLP:conf/nips/TrottZXS19.
@article{DBLP:journals/corr/abs-1911-01417,
  author       = {Trott, Alexander and
                  Zheng, Stephan and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Keeping Your Distance: Solving Sparse Reward Tasks Using Self-Balancing
                  Shaped Rewards},
  journal      = {CoRR},
  volume       = {abs/1911.01417},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.01417},
  eprinttype   = {arXiv},
  eprint       = {1911.01417},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-01417.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1911.03429, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1911-03429,
  author       = {DeYoung, Jay and
                  Jain, Sarthak and
                  Rajani, Nazneen Fatema and
                  Lehman, Eric and
                  Xiong, Caiming and
                  Socher, Richard and
                  Wallace, Byron C.},
  title        = {{ERASER:} {A} Benchmark to Evaluate Rationalized {NLP} Models},
  journal      = {CoRR},
  volume       = {abs/1911.03429},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.03429},
  eprinttype   = {arXiv},
  eprint       = {1911.03429},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-03429.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1911.03588, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1911-03588,
  author       = {Liu, Linqing and
                  Wang, Huan and
                  Lin, Jimmy and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Attentive Student Meets Multi-Task Teacher: Improved Knowledge Distillation
                  for Pretrained Models},
  journal      = {CoRR},
  volume       = {abs/1911.03588},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.03588},
  eprinttype   = {arXiv},
  eprint       = {1911.03588},
  timestamp    = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-03588.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1911.10470, recorded by DBLP under the CoRR journal.
% {Wikipedia} is brace-protected: it is a proper noun that styles which
% sentence-case titles would otherwise lowercase.
@article{DBLP:journals/corr/abs-1911-10470,
  author       = {Asai, Akari and
                  Hashimoto, Kazuma and
                  Hajishirzi, Hannaneh and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Learning to Retrieve Reasoning Paths over {Wikipedia} Graph for Question
                  Answering},
  journal      = {CoRR},
  volume       = {abs/1911.10470},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.10470},
  eprinttype   = {arXiv},
  eprint       = {1911.10470},
  timestamp    = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-10470.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1912.05086, recorded by DBLP under the CoRR journal.
@article{DBLP:journals/corr/abs-1912-05086,
  author       = {Li, Hengduo and
                  Wu, Zuxuan and
                  Zhu, Chen and
                  Xiong, Caiming and
                  Socher, Richard and
                  Davis, Larry S.},
  title        = {Learning from Noisy Anchors for One-stage Object Detection},
  journal      = {CoRR},
  volume       = {abs/1912.05086},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.05086},
  eprinttype   = {arXiv},
  eprint       = {1912.05086},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-05086.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2018 (Volume 1: Long Papers) paper. The citation key is kept exactly as
% DBLP issued it, although the first listed author is Zhong.
@inproceedings{DBLP:conf/acl/SocherZX18,
  author       = {Zhong, Victor and
                  Xiong, Caiming and
                  Socher, Richard},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Global-Locally Self-Attentive Encoder for Dialogue State Tracking},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
                  1: Long Papers},
  pages        = {1458--1467},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1135/},
  doi          = {10.18653/V1/P18-1135},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SocherZX18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2018 (Volume 1: Long Papers) paper. The citation key is kept exactly as
% DBLP issued it, although the first listed author is Min.
@inproceedings{DBLP:conf/acl/SocherZXM18,
  author       = {Min, Sewon and
                  Zhong, Victor and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Efficient and Robust Question Answering from Minimal Context over
                  Documents},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
                  1: Long Papers},
  pages        = {1725--1735},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1160/},
  doi          = {10.18653/V1/P18-1160},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SocherZXM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% CVPR 2018 paper. The url value keeps its backslash-escaped underscores
% exactly as exported; the doi field is the escape-free identifier.
@inproceedings{DBLP:conf/cvpr/ZhouZCSX18,
  author       = {Zhou, Luowei and
                  Zhou, Yingbo and
                  Corso, Jason J. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {End-to-End Dense Video Captioning With Masked Transformer},
  booktitle    = {2018 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2018, Salt Lake City, UT, USA, June 18-22, 2018},
  pages        = {8739--8748},
  publisher    = {Computer Vision Foundation / {IEEE} Computer Society},
  year         = {2018},
  url          = {http://openaccess.thecvf.com/content\_cvpr\_2018/html/Zhou\_End-to-End\_Dense\_Video\_CVPR\_2018\_paper.html},
  doi          = {10.1109/CVPR.2018.00911},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/ZhouZCSX18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2018 paper (pages 1808--1817 of the proceedings).
@inproceedings{DBLP:conf/emnlp/KryscinskiPXS18,
  author       = {Kryscinski, Wojciech and
                  Paulus, Romain and
                  Xiong, Caiming and
                  Socher, Richard},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Improving Abstraction in Text Summarization},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {1808--1817},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1207},
  doi          = {10.18653/V1/D18-1207},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/KryscinskiPXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2018 paper (pages 3243--3253 of the proceedings).
@inproceedings{DBLP:conf/emnlp/LinSX18,
  author       = {Lin, Xi Victoria and
                  Socher, Richard and
                  Xiong, Caiming},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Multi-Hop Knowledge Graph Reasoning with Reward Shaping},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {3243--3253},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1362},
  doi          = {10.18653/V1/D18-1362},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LinSX18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 paper; no editor field is present in this record.
@inproceedings{DBLP:conf/icassp/ZhouXS18,
  author       = {Zhou, Yingbo and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Improving End-to-End Speech Recognition with Policy Learning},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5819--5823},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8462361},
  doi          = {10.1109/ICASSP.2018.8462361},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZhouXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper; the record carries an OpenReview URL and
% no pages or doi field.
@inproceedings{DBLP:conf/iclr/Gu0XLS18,
  author       = {Gu, Jiatao and
                  Bradbury, James and
                  Xiong, Caiming and
                  Li, Victor O. K. and
                  Socher, Richard},
  title        = {Non-Autoregressive Neural Machine Translation},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=B1l8BtlCb},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Gu0XLS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper; DBLP:journals/corr/abs-1708-02182 carries the same title and authors.
@inproceedings{DBLP:conf/iclr/MerityKS18,
  author       = {Merity, Stephen and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {Regularizing and Optimizing {LSTM} Language Models},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=SyyGPP0TZ},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MerityKS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper; DBLP:journals/corr/PaulusXS17 carries the same title and authors.
@inproceedings{DBLP:conf/iclr/PaulusXS18,
  author       = {Paulus, Romain and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {A Deep Reinforced Model for Abstractive Summarization},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=HkAClQgA-},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/PaulusXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper; DBLP:journals/corr/abs-1712-07316 carries the same title and authors.
@inproceedings{DBLP:conf/iclr/SchrimpfM0S18,
  author       = {Schrimpf, Martin and
                  Merity, Stephen and
                  Bradbury, James and
                  Socher, Richard},
  title        = {A Flexible Approach to Automated {RNN} Architecture Generation},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=BJDCPSJPM},
  timestamp    = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SchrimpfM0S18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper; DBLP:journals/corr/abs-1712-07294 carries the same title and authors.
@inproceedings{DBLP:conf/iclr/ShuXS18,
  author       = {Shu, Tianmin and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Hierarchical and Interpretable Skill Acquisition in Multi-task Reinforcement
                  Learning},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=SJJQVZW0b},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ShuXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper; DBLP:journals/corr/abs-1712-08697 carries the same title and authors.
@inproceedings{DBLP:conf/iclr/TrottXS18,
  author       = {Trott, Alexander and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Interpretable Counting for Visual Question Answering},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=S1J2ZyZ0Z},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/TrottXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper on the DCN+ question-answering model.
@inproceedings{DBLP:conf/iclr/XiongZS18,
  author       = {Xiong, Caiming and
                  Zhong, Victor and
                  Socher, Richard},
  title        = {{DCN+:} Mixed Objective And Deep Residual Coattention for Question
                  Answering},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=H1meywxRW},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/XiongZS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2018 paper. CycleGAN is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/Hosseini-AslZXS18,
  author       = {Ehsan Hosseini{-}Asl and
                  Yingbo Zhou and
                  Caiming Xiong and
                  Richard Socher},
  editor       = {B. Yegnanarayana},
  title        = {A Multi-Discriminator {CycleGAN} for Unsupervised Non-Parallel Speech
                  Domain Adaptation},
  booktitle    = {Interspeech 2018, 19th Annual Conference of the International Speech
                  Communication Association, Hyderabad, India, 2-6 September 2018},
  pages        = {3758--3762},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1535},
  doi          = {10.21437/INTERSPEECH.2018-1535},
  timestamp    = {Fri, 21 May 2021 08:16:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Hosseini-AslZXS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1803.08240 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1803-08240,
  author       = {Merity, Stephen and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {An Analysis of Neural Language Modeling at Multiple Scales},
  journal      = {CoRR},
  volume       = {abs/1803.08240},
  year         = {2018},
  url          = {http://arxiv.org/abs/1803.08240},
  eprinttype   = {arXiv},
  eprint       = {1803.08240},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-08240.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1804.00522 (CoRR, 2018). CycleGAN is brace-protected in the
% title so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-1804-00522,
  author       = {Ehsan Hosseini{-}Asl and
                  Yingbo Zhou and
                  Caiming Xiong and
                  Richard Socher},
  title        = {A Multi-Discriminator {CycleGAN} for Unsupervised Non-Parallel Speech
                  Domain Adaptation},
  journal      = {CoRR},
  volume       = {abs/1804.00522},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.00522},
  eprinttype   = {arXiv},
  eprint       = {1804.00522},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-00522.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1804.00819 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1804-00819,
  author       = {Zhou, Luowei and
                  Zhou, Yingbo and
                  Corso, Jason J. and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {End-to-End Dense Video Captioning with Masked Transformer},
  journal      = {CoRR},
  volume       = {abs/1804.00819},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.00819},
  eprinttype   = {arXiv},
  eprint       = {1804.00819},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-00819.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1805.08092 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1805-08092,
  author       = {Min, Sewon and
                  Zhong, Victor and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Efficient and Robust Question Answering from Minimal Context over
                  Documents},
  journal      = {CoRR},
  volume       = {abs/1805.08092},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.08092},
  eprinttype   = {arXiv},
  eprint       = {1805.08092},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-08092.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1805.09655 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1805-09655,
  author       = {Zhong, Victor and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Global-Locally Self-Attentive Dialogue State Tracker},
  journal      = {CoRR},
  volume       = {abs/1805.09655},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.09655},
  eprinttype   = {arXiv},
  eprint       = {1805.09655},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-09655.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1806.06977 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1806-06977,
  author       = {Gotmare, Akhilesh and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Using Mode Connectivity for Loss Landscape Analysis},
  journal      = {CoRR},
  volume       = {abs/1806.06977},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.06977},
  eprinttype   = {arXiv},
  eprint       = {1806.06977},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-06977.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1806.08730 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1806-08730,
  author       = {McCann, Bryan and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {The Natural Language Decathlon: Multitask Learning as Question Answering},
  journal      = {CoRR},
  volume       = {abs/1806.08730},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.08730},
  eprinttype   = {arXiv},
  eprint       = {1806.08730},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-08730.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1807.00374 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1807-00374,
  author       = {Hosseini{-}Asl, Ehsan and
                  Zhou, Yingbo and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Augmented Cyclic Adversarial Learning for Domain Adaptation},
  journal      = {CoRR},
  volume       = {abs/1807.00374},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.00374},
  eprinttype   = {arXiv},
  eprint       = {1807.00374},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-00374.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1808.07913 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1808-07913,
  author       = {Kryscinski, Wojciech and
                  Paulus, Romain and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Improving Abstraction in Text Summarization},
  journal      = {CoRR},
  volume       = {abs/1808.07913},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.07913},
  eprinttype   = {arXiv},
  eprint       = {1808.07913},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-07913.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1808.10568 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1808-10568,
  author       = {Lin, Xi Victoria and
                  Socher, Richard and
                  Xiong, Caiming},
  title        = {Multi-Hop Knowledge Graph Reasoning with Reward Shaping},
  journal      = {CoRR},
  volume       = {abs/1808.10568},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.10568},
  eprinttype   = {arXiv},
  eprint       = {1808.10568},
  timestamp    = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-10568.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1809.07402 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1809-07402,
  author       = {Wang, Huan and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Identifying Generalization Properties in Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1809.07402},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.07402},
  eprinttype   = {arXiv},
  eprint       = {1809.07402},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-07402.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1810.13243 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1810-13243,
  author       = {Gotmare, Akhilesh and
                  Keskar, Nitish Shirish and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {A Closer Look at Deep Learning Heuristics: Learning rate restarts,
                  Warmup and Distillation},
  journal      = {CoRR},
  volume       = {abs/1810.13243},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.13243},
  eprinttype   = {arXiv},
  eprint       = {1810.13243},
  timestamp    = {Thu, 08 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-13243.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1811.12432 (CoRR, 2018). AdaFrame is brace-protected in the
% title so that sentence-casing bibliography styles keep its internal capital.
@article{DBLP:journals/corr/abs-1811-12432,
  author       = {Zuxuan Wu and
                  Caiming Xiong and
                  Chih{-}Yao Ma and
                  Richard Socher and
                  Larry S. Davis},
  title        = {{AdaFrame}: Adaptive Frame Selection for Fast Video Recognition},
  journal      = {CoRR},
  volume       = {abs/1811.12432},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.12432},
  eprinttype   = {arXiv},
  eprint       = {1811.12432},
  timestamp    = {Mon, 03 Dec 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-12432.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2017 paper.
@inproceedings{DBLP:conf/cvpr/LuXPS17,
  author       = {Lu, Jiasen and
                  Xiong, Caiming and
                  Parikh, Devi and
                  Socher, Richard},
  title        = {Knowing When to Look: Adaptive Attention via a Visual Sentinel for
                  Image Captioning},
  booktitle    = {2017 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2017, Honolulu, HI, USA, July 21-26, 2017},
  pages        = {3242--3250},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CVPR.2017.345},
  doi          = {10.1109/CVPR.2017.345},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/LuXPS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% 2017 structured-prediction workshop paper; DBLP:journals/corr/abs-1709-01915 carries the same title and authors.
@inproceedings{DBLP:conf/emnlp/BradburyS17,
  author       = {Bradbury, James and
                  Socher, Richard},
  editor       = {Chang, Kai{-}Wei and
                  Chang, Ming{-}Wei and
                  Srikumar, Vivek and
                  Rush, Alexander M.},
  title        = {Towards Neural Machine Translation with Latent Tree Attention},
  booktitle    = {Proceedings of the 2nd Workshop on Structured Prediction for Natural
                  Language Processing, SPNLP@EMNLP, Copenhagen, Denmark, September 2017},
  pages        = {12--16},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-4303},
  doi          = {10.18653/V1/W17-4303},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/BradburyS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2017 paper.
@inproceedings{DBLP:conf/emnlp/HashimotoXTS17,
  author       = {Hashimoto, Kazuma and
                  Xiong, Caiming and
                  Tsuruoka, Yoshimasa and
                  Socher, Richard},
  editor       = {Palmer, Martha and
                  Hwa, Rebecca and
                  Riedel, Sebastian},
  title        = {A Joint Many-Task Model: Growing a Neural Network for Multiple {NLP}
                  Tasks},
  booktitle    = {Proceedings of the 2017 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September
                  9-11, 2017},
  pages        = {1923--1933},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/d17-1206},
  doi          = {10.18653/V1/D17-1206},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/HashimotoXTS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper.
@inproceedings{DBLP:conf/iclr/0002MXS17,
  author       = {Bradbury, James and
                  Merity, Stephen and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Quasi-Recurrent Neural Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=H1zJ-v5xl},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/0002MXS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper.
@inproceedings{DBLP:conf/iclr/InanKS17,
  author       = {Inan, Hakan and
                  Khosravi, Khashayar and
                  Socher, Richard},
  title        = {Tying Word Vectors and Word Classifiers: {A} Loss Framework for Language
                  Modeling},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=r1aPbsFle},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/InanKS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper.
@inproceedings{DBLP:conf/iclr/MerityX0S17,
  author       = {Merity, Stephen and
                  Xiong, Caiming and
                  Bradbury, James and
                  Socher, Richard},
  title        = {Pointer Sentinel Mixture Models},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=Byj72udxe},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MerityX0S17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper.
@inproceedings{DBLP:conf/iclr/XiongZS17,
  author       = {Xiong, Caiming and
                  Zhong, Victor and
                  Socher, Richard},
  title        = {Dynamic Coattention Networks For Question Answering},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=rJeKjwvclx},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/XiongZS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2017 paper; DBLP:journals/corr/abs-1708-00107 carries the same title and authors.
@inproceedings{DBLP:conf/nips/McCannBXS17,
  author       = {McCann, Bryan and
                  Bradbury, James and
                  Xiong, Caiming and
                  Socher, Richard},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Learned in Translation: Contextualized Word Vectors},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {6294--6305},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/20c86a628232a67e7bd46f76fba7ce12-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/McCannBXS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Rep4NLP 2017 workshop paper; DBLP:journals/corr/abs-1712-05483 carries the same title and authors.
@inproceedings{DBLP:conf/rep4nlp/JohansenS17,
  author       = {Johansen, Alexander Rosenberg and
                  Socher, Richard},
  editor       = {Blunsom, Phil and
                  Bordes, Antoine and
                  Cho, Kyunghyun and
                  Cohen, Shay B. and
                  Dyer, Chris and
                  Grefenstette, Edward and
                  Hermann, Karl Moritz and
                  Rimell, Laura and
                  Weston, Jason and
                  Yih, Scott},
  title        = {Learning when to skim and when to read},
  booktitle    = {Proceedings of the 2nd Workshop on Representation Learning for NLP,
                  Rep4NLP@ACL 2017, Vancouver, Canada, August 3, 2017},
  pages        = {257--264},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-2631},
  doi          = {10.18653/V1/W17-2631},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/rep4nlp/JohansenS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1705.04304 (CoRR, 2017).
@article{DBLP:journals/corr/PaulusXS17,
  author       = {Paulus, Romain and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {A Deep Reinforced Model for Abstractive Summarization},
  journal      = {CoRR},
  volume       = {abs/1705.04304},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.04304},
  eprinttype   = {arXiv},
  eprint       = {1705.04304},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PaulusXS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1708.00107 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1708-00107,
  author       = {McCann, Bryan and
                  Bradbury, James and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Learned in Translation: Contextualized Word Vectors},
  journal      = {CoRR},
  volume       = {abs/1708.00107},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.00107},
  eprinttype   = {arXiv},
  eprint       = {1708.00107},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-00107.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1708.01009 (CoRR, 2017). The acronym RNNs is brace-protected
% in the title so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-1708-01009,
  author       = {Stephen Merity and
                  Bryan McCann and
                  Richard Socher},
  title        = {Revisiting Activation Regularization for Language {RNNs}},
  journal      = {CoRR},
  volume       = {abs/1708.01009},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.01009},
  eprinttype   = {arXiv},
  eprint       = {1708.01009},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-01009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1708.02182 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1708-02182,
  author       = {Merity, Stephen and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {Regularizing and Optimizing {LSTM} Language Models},
  journal      = {CoRR},
  volume       = {abs/1708.02182},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.02182},
  eprinttype   = {arXiv},
  eprint       = {1708.02182},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-02182.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1709.00103 (CoRR, 2017). Seq2SQL is brace-protected in the
% title so that sentence-casing bibliography styles keep its trailing capitals.
@article{DBLP:journals/corr/abs-1709-00103,
  author       = {Victor Zhong and
                  Caiming Xiong and
                  Richard Socher},
  title        = {{Seq2SQL}: Generating Structured Queries from Natural Language using
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1709.00103},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.00103},
  eprinttype   = {arXiv},
  eprint       = {1709.00103},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-00103.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1709.01915 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1709-01915,
  author       = {Bradbury, James and
                  Socher, Richard},
  title        = {Towards Neural Machine Translation with Latent Tree Attention},
  journal      = {CoRR},
  volume       = {abs/1709.01915},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.01915},
  eprinttype   = {arXiv},
  eprint       = {1709.01915},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-01915.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.00106 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1711-00106,
  author       = {Xiong, Caiming and
                  Zhong, Victor and
                  Socher, Richard},
  title        = {{DCN+:} Mixed Objective and Deep Residual Coattention for Question
                  Answering},
  journal      = {CoRR},
  volume       = {abs/1711.00106},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.00106},
  eprinttype   = {arXiv},
  eprint       = {1711.00106},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-00106.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.02132 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1711-02132,
  author       = {Ahmed, Karim and
                  Keskar, Nitish Shirish and
                  Socher, Richard},
  title        = {Weighted Transformer Network for Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1711.02132},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02132},
  eprinttype   = {arXiv},
  eprint       = {1711.02132},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02132.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.02281 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1711-02281,
  author       = {Gu, Jiatao and
                  Bradbury, James and
                  Xiong, Caiming and
                  Li, Victor O. K. and
                  Socher, Richard},
  title        = {Non-Autoregressive Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1711.02281},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02281},
  eprinttype   = {arXiv},
  eprint       = {1711.02281},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02281.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.05483 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1712-05483,
  author       = {Johansen, Alexander Rosenberg and
                  Socher, Richard},
  title        = {Learning when to skim and when to read},
  journal      = {CoRR},
  volume       = {abs/1712.05483},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.05483},
  eprinttype   = {arXiv},
  eprint       = {1712.05483},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-05483.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07101 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1712-07101,
  author       = {Zhou, Yingbo and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Improving End-to-End Speech Recognition with Policy Learning},
  journal      = {CoRR},
  volume       = {abs/1712.07101},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07101},
  eprinttype   = {arXiv},
  eprint       = {1712.07101},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07101.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07108 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1712-07108,
  author       = {Zhou, Yingbo and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Improved Regularization Techniques for End-to-End Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1712.07108},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07108},
  eprinttype   = {arXiv},
  eprint       = {1712.07108},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07108.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07294 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1712-07294,
  author       = {Shu, Tianmin and
                  Xiong, Caiming and
                  Socher, Richard},
  title        = {Hierarchical and Interpretable Skill Acquisition in Multi-task Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1712.07294},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07294},
  eprinttype   = {arXiv},
  eprint       = {1712.07294},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07294.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07296 (CoRR, 2017). The eponym Hessian is brace-protected
% in the title so that sentence-casing bibliography styles keep its capital.
@article{DBLP:journals/corr/abs-1712-07296,
  author       = {Huishuai Zhang and
                  Caiming Xiong and
                  James Bradbury and
                  Richard Socher},
  title        = {Block-diagonal {Hessian}-free Optimization for Training Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1712.07296},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07296},
  eprinttype   = {arXiv},
  eprint       = {1712.07296},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07296.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07316 (CoRR, 2017).
@article{DBLP:journals/corr/abs-1712-07316,
  author       = {Schrimpf, Martin and
                  Merity, Stephen and
                  Bradbury, James and
                  Socher, Richard},
  title        = {A Flexible Approach to Automated {RNN} Architecture Generation},
  journal      = {CoRR},
  volume       = {abs/1712.07316},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07316},
  eprinttype   = {arXiv},
  eprint       = {1712.07316},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07316.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1712.07628 (CoRR, 2017). The optimizer name Adam is
% brace-protected, like SGD, so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-1712-07628,
  author       = {Nitish Shirish Keskar and
                  Richard Socher},
  title        = {Improving Generalization Performance by Switching from {Adam} to {SGD}},
  journal      = {CoRR},
  volume       = {abs/1712.07628},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.07628},
  eprinttype   = {arXiv},
  eprint       = {1712.07628},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-07628.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1712-08697,
  author       = {Alexander Trott and
                  Caiming Xiong and
                  Richard Socher},
  title        = {Interpretable Counting for Visual Question Answering},
  journal      = {CoRR},
  volume       = {abs/1712.08697},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.08697},
  eprinttype    = {arXiv},
  eprint       = {1712.08697},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-08697.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KumarIOIBGZPS16,
  author       = {Ankit Kumar and
                  Ozan Irsoy and
                  Peter Ondruska and
                  Mohit Iyyer and
                  James Bradbury and
                  Ishaan Gulrajani and
                  Victor Zhong and
                  Romain Paulus and
                  Richard Socher},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Ask Me Anything: Dynamic Memory Networks for Natural Language Processing},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {1378--1387},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/kumar16.html},
  timestamp    = {Wed, 29 May 2019 08:41:46 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KumarIOIBGZPS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/XiongMS16,
  author       = {Caiming Xiong and
                  Stephen Merity and
                  Richard Socher},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Dynamic Memory Networks for Visual and Textual Question Answering},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {2397--2406},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/xiong16.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/XiongMS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wassa/Socher16,
  author       = {Richard Socher},
  editor       = {Alexandra Balahur and
                  Erik Van der Goot and
                  Piek Vossen and
                  Andr{\'{e}}s Montoyo},
  title        = {Deep Learning for Sentiment Analysis - Invited Talk},
  booktitle    = {Proceedings of the 7th Workshop on Computational Approaches to Subjectivity,
                  Sentiment and Social Media Analysis, WASSA@NAACL-HLT 2016, June 16,
                  2016, San Diego, California, {USA}},
  pages        = {36},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/w16-0408},
  doi          = {10.18653/V1/W16-0408},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wassa/Socher16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wmt/BradburyS16,
  author       = {James Bradbury and
                  Richard Socher},
  title        = {{MetaMind} Neural Machine Translation System for {WMT} 2016},
  booktitle    = {Proceedings of the First Conference on Machine Translation, {WMT}
                  2016, colocated with {ACL} 2016, August 11-12, Berlin, Germany},
  pages        = {264--267},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/w16-2308},
  doi          = {10.18653/V1/W16-2308},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wmt/BradburyS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/XiongMS16,
  author       = {Caiming Xiong and
                  Stephen Merity and
                  Richard Socher},
  title        = {Dynamic Memory Networks for Visual and Textual Question Answering},
  journal      = {CoRR},
  volume       = {abs/1603.01417},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.01417},
  eprinttype    = {arXiv},
  eprint       = {1603.01417},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/XiongMS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MerityXBS16,
  author       = {Stephen Merity and
                  Caiming Xiong and
                  James Bradbury and
                  Richard Socher},
  title        = {Pointer Sentinel Mixture Models},
  journal      = {CoRR},
  volume       = {abs/1609.07843},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.07843},
  eprinttype    = {arXiv},
  eprint       = {1609.07843},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MerityXBS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/InanKS16,
  author       = {Hakan Inan and
                  Khashayar Khosravi and
                  Richard Socher},
  title        = {Tying Word Vectors and Word Classifiers: {A} Loss Framework for Language
                  Modeling},
  journal      = {CoRR},
  volume       = {abs/1611.01462},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.01462},
  eprinttype    = {arXiv},
  eprint       = {1611.01462},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/InanKS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BradburyMXS16,
  author       = {James Bradbury and
                  Stephen Merity and
                  Caiming Xiong and
                  Richard Socher},
  title        = {Quasi-Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1611.01576},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.01576},
  eprinttype    = {arXiv},
  eprint       = {1611.01576},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BradburyMXS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HashimotoXTS16,
  author       = {Kazuma Hashimoto and
                  Caiming Xiong and
                  Yoshimasa Tsuruoka and
                  Richard Socher},
  title        = {A Joint Many-Task Model: Growing a Neural Network for Multiple {NLP}
                  Tasks},
  journal      = {CoRR},
  volume       = {abs/1611.01587},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.01587},
  eprinttype    = {arXiv},
  eprint       = {1611.01587},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HashimotoXTS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/XiongZS16,
  author       = {Caiming Xiong and
                  Victor Zhong and
                  Richard Socher},
  title        = {Dynamic Coattention Networks For Question Answering},
  journal      = {CoRR},
  volume       = {abs/1611.01604},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.01604},
  eprinttype    = {arXiv},
  eprint       = {1611.01604},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/XiongZS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LongprePXS16,
  author       = {Shayne Longpre and
                  Sabeek Pradhan and
                  Caiming Xiong and
                  Richard Socher},
  title        = {A Way out of the Odyssey: Analyzing and Combining Recent Insights
                  for {LSTMs}},
  journal      = {CoRR},
  volume       = {abs/1611.05104},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.05104},
  eprinttype    = {arXiv},
  eprint       = {1611.05104},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LongprePXS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LuXPS16,
  author       = {Jiasen Lu and
                  Caiming Xiong and
                  Devi Parikh and
                  Richard Socher},
  title        = {Knowing When to Look: Adaptive Attention via {A} Visual Sentinel for
                  Image Captioning},
  journal      = {CoRR},
  volume       = {abs/1612.01887},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.01887},
  eprinttype    = {arXiv},
  eprint       = {1612.01887},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LuXPS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/TaiSM15,
  author       = {Kai Sheng Tai and
                  Richard Socher and
                  Christopher D. Manning},
  title        = {Improved Semantic Representations From Tree-Structured Long Short-Term
                  Memory Networks},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages        = {1556--1566},
  publisher    = {The Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-1150},
  doi          = {10.3115/V1/P15-1150},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/TaiSM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/TaiSM15,
  author       = {Kai Sheng Tai and
                  Richard Socher and
                  Christopher D. Manning},
  title        = {Improved Semantic Representations From Tree-Structured Long Short-Term
                  Memory Networks},
  journal      = {CoRR},
  volume       = {abs/1503.00075},
  year         = {2015},
  url          = {http://arxiv.org/abs/1503.00075},
  eprinttype    = {arXiv},
  eprint       = {1503.00075},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TaiSM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/KumarISBEPOGS15,
  author       = {Ankit Kumar and
                  Ozan Irsoy and
                  Jonathan Su and
                  James Bradbury and
                  Robert English and
                  Brian Pierce and
                  Peter Ondruska and
                  Ishaan Gulrajani and
                  Richard Socher},
  title        = {Ask Me Anything: Dynamic Memory Networks for Natural Language Processing},
  journal      = {CoRR},
  volume       = {abs/1506.07285},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.07285},
  eprinttype    = {arXiv},
  eprint       = {1506.07285},
  timestamp    = {Thu, 21 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/KumarISBEPOGS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/us/Socher14,
  author       = {Richard Socher},
  title        = {Recursive deep learning for natural language processing and computer
                  vision},
  school       = {Stanford University, {USA}},
  year         = {2014},
  url          = {https://searchworks.stanford.edu/view/10608081},
  timestamp    = {Fri, 02 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/us/Socher14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tacl/SocherKLMN14,
  author       = {Richard Socher and
                  Andrej Karpathy and
                  Quoc V. Le and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  title        = {Grounded Compositional Semantics for Finding and Describing Images
                  with Sentences},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {2},
  pages        = {207--218},
  year         = {2014},
  url          = {https://doi.org/10.1162/tacl\_a\_00177},
  doi          = {10.1162/TACL\_A\_00177},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/SocherKLMN14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/IyyerBCSD14,
  author       = {Mohit Iyyer and
                  Jordan L. Boyd{-}Graber and
                  Leonardo Max Batista Claudino and
                  Richard Socher and
                  Hal Daum{\'{e}} III},
  editor       = {Alessandro Moschitti and
                  Bo Pang and
                  Walter Daelemans},
  title        = {A Neural Network for Factoid Question Answering over Paragraphs},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {633--644},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1070},
  doi          = {10.3115/V1/D14-1070},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/IyyerBCSD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/PenningtonSM14,
  author       = {Jeffrey Pennington and
                  Richard Socher and
                  Christopher D. Manning},
  editor       = {Alessandro Moschitti and
                  Bo Pang and
                  Walter Daelemans},
  title        = {{GloVe}: Global Vectors for Word Representation},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {1532--1543},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1162},
  doi          = {10.3115/V1/D14-1162},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/PenningtonSM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lats/KulkarniSBK14,
  author       = {Chinmay Eishan Kulkarni and
                  Richard Socher and
                  Michael S. Bernstein and
                  Scott R. Klemmer},
  editor       = {Mehran Sahami and
                  Armando Fox and
                  Marti A. Hearst and
                  Michelene T. H. Chi},
  title        = {Scaling short-answer grading by combining peer assessment with algorithmic
                  scoring},
  booktitle    = {First {(2014)} {ACM} Conference on Learning @ Scale, L@S 2014, Atlanta,
                  GA, USA, March 4-5, 2014},
  pages        = {99--108},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2556325.2566238},
  doi          = {10.1145/2556325.2566238},
  timestamp    = {Sat, 24 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lats/KulkarniSBK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/PaulusSM14,
  author       = {Romain Paulus and
                  Richard Socher and
                  Christopher D. Manning},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {Global Belief Recursive Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {2888--2896},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/1415db70fe9ddb119e23e9b2808cde38-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PaulusSM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SocherBMN13,
  author       = {Richard Socher and
                  John Bauer and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  title        = {Parsing with Compositional Vector Grammars},
  booktitle    = {Proceedings of the 51st Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2013, 4-9 August 2013, Sofia, Bulgaria, Volume
                  1: Long Papers},
  pages        = {455--465},
  publisher    = {The Association for Computational Linguistics},
  year         = {2013},
  url          = {https://aclanthology.org/P13-1045/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SocherBMN13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/conll/LuongSM13,
  author       = {Thang Luong and
                  Richard Socher and
                  Christopher D. Manning},
  editor       = {Julia Hockenmaier and
                  Sebastian Riedel},
  title        = {Better Word Representations with Recursive Neural Networks for Morphology},
  booktitle    = {Proceedings of the Seventeenth Conference on Computational Natural
                  Language Learning, CoNLL 2013, Sofia, Bulgaria, August 8-9, 2013},
  pages        = {104--113},
  publisher    = {{ACL}},
  year         = {2013},
  url          = {https://aclanthology.org/W13-3512/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/conll/LuongSM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZouSCM13,
  author       = {Will Y. Zou and
                  Richard Socher and
                  Daniel M. Cer and
                  Christopher D. Manning},
  title        = {Bilingual Word Embeddings for Phrase-Based Machine Translation},
  booktitle    = {Proceedings of the 2013 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2013, 18-21 October 2013, Grand Hyatt
                  Seattle, Seattle, Washington, USA, {A} meeting of SIGDAT, a Special
                  Interest Group of the {ACL}},
  pages        = {1393--1398},
  publisher    = {{ACL}},
  year         = {2013},
  url          = {https://aclanthology.org/D13-1141/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZouSCM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/SocherPWCMNP13,
  author       = {Richard Socher and
                  Alex Perelygin and
                  Jean Wu and
                  Jason Chuang and
                  Christopher D. Manning and
                  Andrew Y. Ng and
                  Christopher Potts},
  title        = {Recursive Deep Models for Semantic Compositionality Over a Sentiment
                  Treebank},
  booktitle    = {Proceedings of the 2013 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2013, 18-21 October 2013, Grand Hyatt
                  Seattle, Seattle, Washington, USA, {A} meeting of SIGDAT, a Special
                  Interest Group of the {ACL}},
  pages        = {1631--1642},
  publisher    = {{ACL}},
  year         = {2013},
  url          = {https://aclanthology.org/D13-1170/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SocherPWCMNP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/SocherM13,
  author       = {Richard Socher and
                  Christopher D. Manning},
  editor       = {Lucy Vanderwende and
                  Hal Daum{\'{e}} III and
                  Katrin Kirchhoff},
  title        = {Deep Learning for {NLP} (without Magic)},
  booktitle    = {Human Language Technologies: Conference of the North American Chapter
                  of the Association for Computational Linguistics, Proceedings, June
                  9-14, 2013, Westin Peachtree Plaza Hotel, Atlanta, Georgia, {USA}},
  pages        = {1--3},
  publisher    = {The Association for Computational Linguistics},
  year         = {2013},
  url          = {https://aclanthology.org/N13-4001/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/SocherM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SocherCMN13,
  author       = {Richard Socher and
                  Danqi Chen and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Christopher J. C. Burges and
                  L{\'{e}}on Bottou and
                  Zoubin Ghahramani and
                  Kilian Q. Weinberger},
  title        = {Reasoning With Neural Tensor Networks for Knowledge Base Completion},
  booktitle    = {Advances in Neural Information Processing Systems 26: 27th Annual
                  Conference on Neural Information Processing Systems 2013. Proceedings
                  of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages        = {926--934},
  year         = {2013},
  url          = {https://proceedings.neurips.cc/paper/2013/hash/b337e84de8752b27eda3a12363109e80-Abstract.html},
  timestamp    = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SocherCMN13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SocherGMN13,
  author       = {Richard Socher and
                  Milind Ganjoo and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Christopher J. C. Burges and
                  L{\'{e}}on Bottou and
                  Zoubin Ghahramani and
                  Kilian Q. Weinberger},
  title        = {Zero-Shot Learning Through Cross-Modal Transfer},
  booktitle    = {Advances in Neural Information Processing Systems 26: 27th Annual
                  Conference on Neural Information Processing Systems 2013. Proceedings
                  of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages        = {935--943},
  year         = {2013},
  url          = {https://proceedings.neurips.cc/paper/2013/hash/2d6cc4b2d139a53512fb8cbb3086ae2e-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SocherGMN13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1301-3618,
  author       = {Danqi Chen and
                  Richard Socher and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Learning New Facts From Knowledge Bases With Neural Tensor Networks
                  and Semantic Word Vectors},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3618},
  timestamp    = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3618.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1301-3666,
  author       = {Richard Socher and
                  Milind Ganjoo and
                  Hamsa Sridhar and
                  Osbert Bastani and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Zero-Shot Learning Through Cross-Modal Transfer},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3666},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3666.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/acl/2013cvsm,
  editor       = {Alexandre Allauzen and
                  Hugo Larochelle and
                  Christopher D. Manning and
                  Richard Socher},
  title        = {Proceedings of the Workshop on Continuous Vector Space Models and
                  their Compositionality, CVSM@ACL 2013, Sofia, Bulgaria, August 9,
                  2013},
  publisher    = {Association for Computational Linguistics},
  year         = {2013},
  url          = {https://aclanthology.org/volumes/W13-32/},
  isbn         = {978-1-937284-67-1},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/2013cvsm.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SocherBM12,
  author       = {Richard Socher and
                  Yoshua Bengio and
                  Christopher D. Manning},
  title        = {Deep Learning for {NLP} (without Magic)},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Tutorial Abstracts, July 8, 2012, Jeju Island, Korea},
  pages        = {5},
  publisher    = {The Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-4005/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SocherBM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/HuangSMN12,
  author       = {Eric H. Huang and
                  Richard Socher and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  title        = {Improving Word Representations via Global Context and Multiple Word
                  Prototypes},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Proceedings of the Conference, July 8-14, 2012, Jeju Island, Korea
                  - Volume 1: Long Papers},
  pages        = {873--882},
  publisher    = {The Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-1092/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/HuangSMN12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/SocherHMN12,
  author       = {Richard Socher and
                  Brody Huval and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Jun'ichi Tsujii and
                  James Henderson and
                  Marius Pasca},
  title        = {Semantic Compositionality through Recursive Matrix-Vector Spaces},
  booktitle    = {Proceedings of the 2012 Joint Conference on Empirical Methods in Natural
                  Language Processing and Computational Natural Language Learning, EMNLP-CoNLL
                  2012, July 12-14, 2012, Jeju Island, Korea},
  pages        = {1201--1211},
  publisher    = {{ACL}},
  year         = {2012},
  url          = {https://aclanthology.org/D12-1110/},
  timestamp    = {Thu, 14 Apr 2022 16:28:48 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SocherHMN12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SocherHBMN12,
  author       = {Richard Socher and
                  Brody Huval and
                  Bharath Putta Bath and
                  Christopher D. Manning and
                  Andrew Y. Ng},
  editor       = {Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Christopher J. C. Burges and
                  L{\'{e}}on Bottou and
                  Kilian Q. Weinberger},
  title        = {Convolutional-Recursive Deep Learning for {3D} Object Classification},
  booktitle    = {Advances in Neural Information Processing Systems 25: 26th Annual
                  Conference on Neural Information Processing Systems 2012. Proceedings
                  of a meeting held December 3-6, 2012, Lake Tahoe, Nevada, United States},
  pages        = {665--673},
  year         = {2012},
  url          = {https://proceedings.neurips.cc/paper/2012/hash/3eae62bba9ddf64f69d49dc48e2dd214-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SocherHBMN12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/SocherPHNM11,
  author       = {Richard Socher and
                  Jeffrey Pennington and
                  Eric H. Huang and
                  Andrew Y. Ng and
                  Christopher D. Manning},
  title        = {Semi-Supervised Recursive Autoencoders for Predicting Sentiment Distributions},
  booktitle    = {Proceedings of the 2011 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2011, 27-31 July 2011, John McIntyre
                  Conference Centre, Edinburgh, UK, {A} meeting of SIGDAT, a Special
                  Interest Group of the {ACL}},
  pages        = {151--161},
  publisher    = {{ACL}},
  year         = {2011},
  url          = {https://aclanthology.org/D11-1014/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/SocherPHNM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/SocherLNM11,
  author       = {Richard Socher and
                  Cliff Chiung{-}Yu Lin and
                  Andrew Y. Ng and
                  Christopher D. Manning},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Parsing Natural Scenes and Natural Language with Recursive Neural
                  Networks},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {129--136},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/125\_icmlpaper.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/SocherLNM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Neural Information Processing Systems 2011 paper: unfolding recursive autoencoders for paraphrase detection.
@inproceedings{DBLP:conf/nips/SocherHPNM11,
  author    = {Socher, Richard and
               Huang, Eric H. and
               Pennington, Jeffrey and
               Ng, Andrew Y. and
               Manning, Christopher D.},
  editor    = {Shawe{-}Taylor, John and
               Zemel, Richard S. and
               Bartlett, Peter L. and
               Pereira, Fernando C. N. and
               Weinberger, Kilian Q.},
  title     = {Dynamic Pooling and Unfolding Recursive Autoencoders for Paraphrase Detection},
  booktitle = {Advances in Neural Information Processing Systems 24: 25th Annual Conference on
               Neural Information Processing Systems 2011. Proceedings of a meeting held
               12-14 December 2011, Granada, Spain},
  pages     = {801--809},
  year      = {2011},
  url       = {https://proceedings.neurips.cc/paper/2011/hash/3335881e06d4d23091389226225e17c7-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/SocherHPNM11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% AISTATS 2011 paper, published as volume 15 of the JMLR Proceedings series.
% {Chinese} is braced so that sentence-casing bibliography styles keep its capital letter.
@inproceedings{DBLP:journals/jmlr/SocherMM11,
  author       = {Richard Socher and
                  Andrew L. Maas and
                  Christopher D. Manning},
  editor       = {Geoffrey J. Gordon and
                  David B. Dunson and
                  Miroslav Dud{\'{\i}}k},
  title        = {Spectral {Chinese} Restaurant Processes: Nonparametric Clustering Based
                  on Similarities},
  booktitle    = {Proceedings of the Fourteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2011, Fort Lauderdale, USA,
                  April 11-13, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {15},
  pages        = {698--706},
  publisher    = {JMLR.org},
  year         = {2011},
  url          = {https://proceedings.mlr.press/v15/socher11a/socher11a.pdf},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/SocherMM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2010 conference paper: semi-supervised image segmentation and annotation from unaligned text.
@inproceedings{DBLP:conf/cvpr/Socher010,
  author    = {Socher, Richard and
               Fei{-}Fei, Li},
  title     = {Connecting modalities: Semi-supervised segmentation and annotation of images
               using unaligned text corpora},
  booktitle = {The Twenty-Third {IEEE} Conference on Computer Vision and Pattern Recognition,
               {CVPR} 2010, San Francisco, CA, USA, 13-18 June 2010},
  pages     = {966--973},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/CVPR.2010.5540112},
  doi       = {10.1109/CVPR.2010.5540112},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/Socher010.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CVPR 2009 conference paper introducing the ImageNet image database.
% {ImageNet} is braced so that sentence-casing bibliography styles do not print "Imagenet".
@inproceedings{DBLP:conf/cvpr/DengDSLL009,
  author       = {Jia Deng and
                  Wei Dong and
                  Richard Socher and
                  Li{-}Jia Li and
                  Kai Li and
                  Li Fei{-}Fei},
  title        = {{ImageNet}: {A} large-scale hierarchical image database},
  booktitle    = {2009 {IEEE} Computer Society Conference on Computer Vision and Pattern
                  Recognition ({CVPR} 2009), 20-25 June 2009, Miami, Florida, {USA}},
  pages        = {248--255},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
  url          = {https://doi.org/10.1109/CVPR.2009.5206848},
  doi          = {10.1109/CVPR.2009.5206848},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/DengDSLL009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2009 conference paper: joint scene classification, annotation and segmentation.
% The protective braces in booktitle wrap only the acronym, not the opening parenthesis.
@inproceedings{DBLP:conf/cvpr/LiS009,
  author       = {Li{-}Jia Li and
                  Richard Socher and
                  Li Fei{-}Fei},
  title        = {Towards total scene understanding: Classification, annotation and
                  segmentation in an automatic framework},
  booktitle    = {2009 {IEEE} Computer Society Conference on Computer Vision and Pattern
                  Recognition ({CVPR} 2009), 20-25 June 2009, Miami, Florida, {USA}},
  pages        = {2036--2043},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
  url          = {https://doi.org/10.1109/CVPR.2009.5206718},
  doi          = {10.1109/CVPR.2009.5206718},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/LiS009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Neural Information Processing Systems 2009 paper on a Bayesian analysis of free recall.
% {Bayesian} is braced so that sentence-casing bibliography styles keep its capital letter.
@inproceedings{DBLP:conf/nips/SocherGPSBN09,
  author       = {Richard Socher and
                  Samuel Gershman and
                  Adler J. Perotte and
                  Per B. Sederberg and
                  David M. Blei and
                  Kenneth A. Norman},
  editor       = {Yoshua Bengio and
                  Dale Schuurmans and
                  John D. Lafferty and
                  Christopher K. I. Williams and
                  Aron Culotta},
  title        = {A {Bayesian} Analysis of Dynamics in Free Recall},
  booktitle    = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  pages        = {1714--1722},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2009/hash/efe937780e95574250dabe07151bdc23-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SocherGPSBN09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ISBI 2008 conference paper: learning-based hierarchical model for vessel segmentation.
@inproceedings{DBLP:conf/isbi/SocherBC08,
  author    = {Socher, Richard and
               Barbu, Adrian and
               Comaniciu, Dorin},
  title     = {A learning based hierarchical model for vessel segmentation},
  booktitle = {Proceedings of the 2008 {IEEE} International Symposium on Biomedical Imaging:
               From Nano to Macro, Paris, France, May 14-17, 2008},
  pages     = {1055--1058},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ISBI.2008.4541181},
  doi       = {10.1109/ISBI.2008.4541181},
  timestamp = {Wed, 04 Oct 2023 17:01:25 +0200},
  biburl    = {https://dblp.org/rec/conf/isbi/SocherBC08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NODALIDA 2007 conference paper: combining contexts in lexicon learning for semantic parsing.
@inproceedings{DBLP:conf/nodalida/SocherBO07,
  author    = {Socher, Richard and
               Biemann, Chris and
               Osswald, Rainer},
  editor    = {Nivre, Joakim and
               Kaalep, Heiki{-}Jaan and
               Muischnek, Kadri and
               Koit, Mare},
  title     = {Combining Contexts in Lexicon Learning for Semantic Parsing},
  booktitle = {Proceedings of the 16th Nordic Conference of Computational Linguistics, {NODALIDA} 2007,
               Tartu, Estonia, May 2007},
  pages     = {175--182},
  publisher = {University of Tartu, Estonia},
  year      = {2007},
  url       = {https://aclanthology.org/W07-2425/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/nodalida/SocherBO07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics