default search action
BibTeX records: Long Ouyang
% NeurIPS 2022 proceedings paper. The CoRR record with the same title is
% DBLP:journals/corr/abs-2203-02155.
% The url is stored raw (no backslash before the underscore) so that
% biblatex/Biber and url-aware styles, which read the field verbatim, resolve it.
% NOTE(review): the second author is "Jeffrey Wu" here but "Jeff Wu" in the
% CoRR record; kept as exported -- confirm which form is wanted.
@inproceedings{DBLP:conf/nips/Ouyang0JAWMZASR22,
  author     = {Long Ouyang and
                Jeffrey Wu and
                Xu Jiang and
                Diogo Almeida and
                Carroll L. Wainwright and
                Pamela Mishkin and
                Chong Zhang and
                Sandhini Agarwal and
                Katarina Slama and
                Alex Ray and
                John Schulman and
                Jacob Hilton and
                Fraser Kelton and
                Luke Miller and
                Maddie Simens and
                Amanda Askell and
                Peter Welinder and
                Paul F. Christiano and
                Jan Leike and
                Ryan Lowe},
  editor     = {Sanmi Koyejo and
                S. Mohamed and
                A. Agarwal and
                Danielle Belgrave and
                K. Cho and
                A. Oh},
  title      = {Training language models to follow instructions with human feedback},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference
                on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper_files/paper/2022/hash/b1efde53be364a73914f58805a001731-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Ouyang0JAWMZASR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 2203.02155) record. The proceedings record with the same title
% is DBLP:conf/nips/Ouyang0JAWMZASR22.
@article{DBLP:journals/corr/abs-2203-02155,
  author     = {Long Ouyang and
                Jeff Wu and
                Xu Jiang and
                Diogo Almeida and
                Carroll L. Wainwright and
                Pamela Mishkin and
                Chong Zhang and
                Sandhini Agarwal and
                Katarina Slama and
                Alex Ray and
                John Schulman and
                Jacob Hilton and
                Fraser Kelton and
                Luke Miller and
                Maddie Simens and
                Amanda Askell and
                Peter Welinder and
                Paul F. Christiano and
                Jan Leike and
                Ryan Lowe},
  title      = {Training language models to follow instructions with human feedback},
  journal    = {CoRR},
  volume     = {abs/2203.02155},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.02155},
  doi        = {10.48550/ARXIV.2203.02155},
  eprinttype = {arXiv},
  eprint     = {2203.02155},
  timestamp  = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-02155.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 2206.05802) record, 2022.
@article{DBLP:journals/corr/abs-2206-05802,
  author     = {William Saunders and
                Catherine Yeh and
                Jeff Wu and
                Steven Bills and
                Long Ouyang and
                Jonathan Ward and
                Jan Leike},
  title      = {Self-critiquing models for assisting human evaluators},
  journal    = {CoRR},
  volume     = {abs/2206.05802},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.05802},
  doi        = {10.48550/ARXIV.2206.05802},
  eprinttype = {arXiv},
  eprint     = {2206.05802},
  timestamp  = {Mon, 20 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-05802.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 2109.10862) record, 2021.
@article{DBLP:journals/corr/abs-2109-10862,
  author     = {Jeff Wu and
                Long Ouyang and
                Daniel M. Ziegler and
                Nisan Stiennon and
                Ryan Lowe and
                Jan Leike and
                Paul F. Christiano},
  title      = {Recursively Summarizing Books with Human Feedback},
  journal    = {CoRR},
  volume     = {abs/2109.10862},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.10862},
  eprinttype = {arXiv},
  eprint     = {2109.10862},
  timestamp  = {Mon, 04 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-10862.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 2112.09332) record, 2021.
% "WebGPT" is brace-protected in the title: styles that sentence-case titles
% would otherwise lowercase everything after the first letter ("Webgpt").
@article{DBLP:journals/corr/abs-2112-09332,
  author     = {Reiichiro Nakano and
                Jacob Hilton and
                Suchir Balaji and
                Jeff Wu and
                Long Ouyang and
                Christina Kim and
                Christopher Hesse and
                Shantanu Jain and
                Vineet Kosaraju and
                William Saunders and
                Xu Jiang and
                Karl Cobbe and
                Tyna Eloundou and
                Gretchen Krueger and
                Kevin Button and
                Matthew Knight and
                Benjamin Chess and
                John Schulman},
  title      = {{WebGPT}: Browser-assisted question-answering with human feedback},
  journal    = {CoRR},
  volume     = {abs/2112.09332},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.09332},
  eprinttype = {arXiv},
  eprint     = {2112.09332},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-09332.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2020 proceedings paper.
% NOTE(review): DBLP:journals/corr/abs-2009-01325 lists the same authors with a
% title differing only in "with" vs "from" -- presumably the preprint of this
% paper; both titles are kept exactly as exported. Verify before merging.
@inproceedings{DBLP:conf/nips/StiennonO0ZLVRA20,
  author     = {Nisan Stiennon and
                Long Ouyang and
                Jeffrey Wu and
                Daniel M. Ziegler and
                Ryan Lowe and
                Chelsea Voss and
                Alec Radford and
                Dario Amodei and
                Paul F. Christiano},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Learning to summarize with human feedback},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference
                on Neural Information Processing Systems 2020, NeurIPS 2020, December
                6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/1f89885d556929e98d3ef9b86448f951-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/StiennonO0ZLVRA20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 2009.01325) record, 2020.
@article{DBLP:journals/corr/abs-2009-01325,
  author     = {Nisan Stiennon and
                Long Ouyang and
                Jeff Wu and
                Daniel M. Ziegler and
                Ryan Lowe and
                Chelsea Voss and
                Alec Radford and
                Dario Amodei and
                Paul F. Christiano},
  title      = {Learning to summarize from human feedback},
  journal    = {CoRR},
  volume     = {abs/2009.01325},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.01325},
  eprinttype = {arXiv},
  eprint     = {2009.01325},
  timestamp  = {Thu, 01 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-01325.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CogSci 2018 proceedings paper.
% The {A} after the colon is brace-protected so sentence-casing styles keep
% its capital.
@inproceedings{DBLP:conf/cogsci/OuyangTLG18,
  author     = {Long Ouyang and
                Michael Henry Tessler and
                Daniel Ly and
                Noah D. Goodman},
  editor     = {Chuck Kalish and
                Martina A. Rau and
                Xiaojin (Jerry) Zhu and
                Timothy T. Rogers},
  title      = {webppl-oed: {A} practical optimal experiment design system},
  booktitle  = {Proceedings of the 40th Annual Meeting of the Cognitive Science Society,
                CogSci 2018, Madison, WI, USA, July 25-28, 2018},
  publisher  = {cognitivesciencesociety.org},
  year       = {2018},
  url        = {https://mindmodeling.org/cogsci2018/papers/0420/index.html},
  timestamp  = {Wed, 17 Apr 2024 12:43:20 +0200},
  biburl     = {https://dblp.org/rec/conf/cogsci/OuyangTLG18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 1805.08427) record, 2018; single author.
@article{DBLP:journals/corr/abs-1805-08427,
  author     = {Long Ouyang},
  title      = {Bayesian Inference of Regular Expressions from Human-Generated Example Strings},
  journal    = {CoRR},
  volume     = {abs/1805.08427},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.08427},
  eprinttype = {arXiv},
  eprint     = {1805.08427},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-08427.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 1711.09401) record, 2017.
@article{DBLP:journals/corr/abs-1711-09401,
  author     = {Long Ouyang and
                Michael C. Frank},
  title      = {Pedagogical Learning},
  journal    = {CoRR},
  volume     = {abs/1711.09401},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.09401},
  eprinttype = {arXiv},
  eprint     = {1711.09401},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-09401.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% POPL 2016 proceedings paper (ACM), pages 271--283.
% Accented letters are written as brace groups that start with a control
% sequence, so BibTeX treats each one as a single letter.
@inproceedings{DBLP:conf/popl/BorgstromGORSS16,
  author     = {Johannes Borgstr{\"{o}}m and
                Andrew D. Gordon and
                Long Ouyang and
                Claudio V. Russo and
                Adam {\'{S}}cibior and
                Marcin Szymczak},
  editor     = {Rastislav Bod{\'{\i}}k and
                Rupak Majumdar},
  title      = {Fabular: regression formulas as probabilistic programming},
  booktitle  = {Proceedings of the 43rd Annual {ACM} {SIGPLAN-SIGACT} Symposium on
                Principles of Programming Languages, {POPL} 2016, St. Petersburg,
                FL, USA, January 20 - 22, 2016},
  pages      = {271--283},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {https://doi.org/10.1145/2837614.2837653},
  doi        = {10.1145/2837614.2837653},
  timestamp  = {Mon, 14 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/popl/BorgstromGORSS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv 1608.05046) record, 2016.
@article{DBLP:journals/corr/OuyangTLG16,
  author     = {Long Ouyang and
                Michael Henry Tessler and
                Daniel Ly and
                Noah D. Goodman},
  title      = {Practical optimal experiment design with probabilistic programs},
  journal    = {CoRR},
  volume     = {abs/1608.05046},
  year       = {2016},
  url        = {http://arxiv.org/abs/1608.05046},
  eprinttype = {arXiv},
  eprint     = {1608.05046},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/OuyangTLG16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CogSci 2012 proceedings paper.
@inproceedings{DBLP:conf/cogsci/OuyangBF12,
  author     = {Long Ouyang and
                Lera Boroditsky and
                Michael C. Frank},
  editor     = {Naomi Miyake and
                David Peebles and
                Richard P. Cooper},
  title      = {Semantic Coherence Facilitates Distributional Learning of Word Meanings},
  booktitle  = {Proceedings of the 34th Annual Meeting of the Cognitive Science Society,
                CogSci 2012, Sapporo, Japan, August 1-4, 2012},
  publisher  = {cognitivesciencesociety.org},
  year       = {2012},
  url        = {https://escholarship.org/uc/item/7275830t},
  timestamp  = {Tue, 30 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cogsci/OuyangBF12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies in your web browser. For more information, see our F.A.Q.