default search action
BibTeX records: Surya Ganguli
% Journal article, Neural Computation 36(1), 2024. Same author list as the arXiv entry DBLP:journals/corr/abs-2107-09133 (titles differ slightly; presumably the preprint of this paper).
@article{DBLP:journals/neco/KuninSGMTGY24,
  author     = {Daniel Kunin and Javier Sagastuy{-}Bre{\~{n}}a and Lauren Gillespie and Eshed Margalit and Hidenori Tanaka and Surya Ganguli and Daniel L. K. Yamins},
  title      = {The Limiting Dynamics of {SGD:} Modified Loss, Phase-Space Oscillations, and Anomalous Diffusion},
  journal    = {Neural Computation},
  volume     = {36},
  number     = {1},
  pages      = {151--174},
  year       = {2024},
  url        = {https://doi.org/10.1162/neco\_a\_01626},
  doi        = {10.1162/NECO\_A\_01626},
  timestamp  = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/neco/KuninSGMTGY24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2403.02579 (CoRR), 2024.
@article{DBLP:journals/corr/abs-2403-02579,
  author     = {Aditya Cowsik and Tamra Nebabu and Xiao{-}Liang Qi and Surya Ganguli},
  title      = {Geometric Dynamics of Signal Propagation Predict Trainability of Transformers},
  journal    = {CoRR},
  volume     = {abs/2403.02579},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.02579},
  doi        = {10.48550/ARXIV.2403.02579},
  eprinttype = {arXiv},
  eprint     = {2403.02579},
  timestamp  = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-02579.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.06158 (CoRR), 2024.
@article{DBLP:journals/corr/abs-2406-06158,
  author     = {Daniel Kunin and Allan Ravent{\'{o}}s and Cl{\'{e}}mentine Domin{\'{e}} and Feng Chen and David Klindt and Andrew M. Saxe and Surya Ganguli},
  title      = {Get rich quick: exact solutions reveal how unbalanced initializations promote rapid feature learning},
  journal    = {CoRR},
  volume     = {abs/2406.06158},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2406.06158},
  doi        = {10.48550/ARXIV.2406.06158},
  eprinttype = {arXiv},
  eprint     = {2406.06158},
  timestamp  = {Sat, 13 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-06158.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Transactions on Machine Learning Research, 2023. Same title and author list as the arXiv entry DBLP:journals/corr/abs-2211-09110.
@article{DBLP:journals/tmlr/LiangBLTSYZNWKN23,
  author     = {Percy Liang and Rishi Bommasani and Tony Lee and Dimitris Tsipras and Dilara Soylu and Michihiro Yasunaga and Yian Zhang and Deepak Narayanan and Yuhuai Wu and Ananya Kumar and Benjamin Newman and Binhang Yuan and Bobby Yan and Ce Zhang and Christian Cosgrove and Christopher D. Manning and Christopher R{\'{e}} and Diana Acosta{-}Navas and Drew A. Hudson and Eric Zelikman and Esin Durmus and Faisal Ladhak and Frieda Rong and Hongyu Ren and Huaxiu Yao and Jue Wang and Keshav Santhanam and Laurel J. Orr and Lucia Zheng and Mert Y{\"{u}}ksekg{\"{o}}n{\"{u}}l and Mirac Suzgun and Nathan Kim and Neel Guha and Niladri S. Chatterji and Omar Khattab and Peter Henderson and Qian Huang and Ryan Chi and Sang Michael Xie and Shibani Santurkar and Surya Ganguli and Tatsunori Hashimoto and Thomas Icard and Tianyi Zhang and Vishrav Chaudhary and William Wang and Xuechen Li and Yifan Mai and Yuhui Zhang and Yuta Koreeda},
  title      = {Holistic Evaluation of Language Models},
  journal    = {Transactions on Machine Learning Research},
  volume     = {2023},
  year       = {2023},
  url        = {https://openreview.net/forum?id=iO4LZibEqW},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tmlr/LiangBLTSYZNWKN23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2210-03820.
@inproceedings{DBLP:conf/iclr/KuninYMG23,
  author     = {Daniel Kunin and Atsushi Yamamura and Chao Ma and Surya Ganguli},
  title      = {The Asymmetric Maximum Margin Bias of Quasi-Homogeneous Neural Networks},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/forum?id=IM4xp7kGI5V},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KuninYMG23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2210-03044.
@inproceedings{DBLP:conf/iclr/PaulCLFGD23,
  author     = {Mansheej Paul and Feng Chen and Brett W. Larsen and Jonathan Frankle and Surya Ganguli and Gintare Karolina Dziugaite},
  title      = {Unmasking the Lottery Ticket Hypothesis: What's Encoded in a Winning Ticket's Mask?},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/forum?id=xSsW2Am-ukZ},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PaulCLFGD23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 conference paper. The arXiv entry DBLP:journals/corr/abs-2210-01768 has the same authors and a near-identical title.
% The last author is spelled as in that arXiv entry so both records name the same person identically.
@inproceedings{DBLP:conf/iclr/WhittingtonDGB23,
  author     = {James C. R. Whittington and Will Dorrell and Surya Ganguli and Timothy Edward John Behrens},
  title      = {Disentanglement with Biological Constraints: {A} Theory of Functional Cell Types},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/forum?id=9Z\_GfhZnGH},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WhittingtonDGB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2306-04251.
@inproceedings{DBLP:conf/nips/ChenKYG23,
  author     = {Feng Chen and Daniel Kunin and Atsushi Yamamura and Surya Ganguli},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Stochastic Collapse: How Gradient Noise Attracts {SGD} Dynamics Towards Simpler Subnetworks},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/6e4432b912599d11609b9cdf98c823c5-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ChenKYG23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 conference paper.
@inproceedings{DBLP:conf/nips/DingLMSGB23,
  author     = {Xuehao Ding and Dongsoo Lee and Joshua Melander and George Sivulka and Surya Ganguli and Stephen Baccus},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Information Geometry of the Retinal Representation Manifold},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/8a267516a7a697965c6ae4f48b908605-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DingLMSGB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2306-15063.
% {Bayesian} is braced so sentence-casing styles keep the capital B.
@inproceedings{DBLP:conf/nips/RaventosPCG23,
  author     = {Allan Ravent{\'{o}}s and Mansheej Paul and Feng Chen and Surya Ganguli},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Pretraining task diversity and the emergence of non-{Bayesian} in-context learning for regression},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/2e10b2c2e1aa4f8083c37dfe269873f8-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/RaventosPCG23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2303.09540 (CoRR), 2023.
% {SemDeDup:} is braced so sentence-casing styles do not flatten the camelCase name.
@article{DBLP:journals/corr/abs-2303-09540,
  author     = {Amro Abbas and Kushal Tirumala and Daniel Simig and Surya Ganguli and Ari S. Morcos},
  title      = {{SemDeDup:} Data-efficient learning at web-scale through semantic deduplication},
  journal    = {CoRR},
  volume     = {abs/2303.09540},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.09540},
  doi        = {10.48550/ARXIV.2303.09540},
  eprinttype = {arXiv},
  eprint     = {2303.09540},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-09540.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.04251 (CoRR), 2023. Same title and authors as the NeurIPS entry DBLP:conf/nips/ChenKYG23.
@article{DBLP:journals/corr/abs-2306-04251,
  author     = {Feng Chen and Daniel Kunin and Atsushi Yamamura and Surya Ganguli},
  title      = {Stochastic Collapse: How Gradient Noise Attracts {SGD} Dynamics Towards Simpler Subnetworks},
  journal    = {CoRR},
  volume     = {abs/2306.04251},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.04251},
  doi        = {10.48550/ARXIV.2306.04251},
  eprinttype = {arXiv},
  eprint     = {2306.04251},
  timestamp  = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-04251.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.15063 (CoRR), 2023. Same title and authors as the NeurIPS entry DBLP:conf/nips/RaventosPCG23.
% {Bayesian} is braced so sentence-casing styles keep the capital B.
@article{DBLP:journals/corr/abs-2306-15063,
  author     = {Allan Ravent{\'{o}}s and Mansheej Paul and Feng Chen and Surya Ganguli},
  title      = {Pretraining task diversity and the emergence of non-{Bayesian} in-context learning for regression},
  journal    = {CoRR},
  volume     = {abs/2306.15063},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.15063},
  doi        = {10.48550/ARXIV.2306.15063},
  eprinttype = {arXiv},
  eprint     = {2306.15063},
  timestamp  = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-15063.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Neural Computation 34(8), 2022.
@article{DBLP:journals/neco/NayebiSBKKGSDY22,
  author     = {Aran Nayebi and Javier Sagastuy{-}Bre{\~{n}}a and Daniel M. Bear and Kohitij Kar and Jonas Kubilius and Surya Ganguli and David Sussillo and James J. DiCarlo and Daniel L. K. Yamins},
  title      = {Recurrent Connections in the Primate Ventral Visual Stream Mediate a Trade-Off Between Task Performance and Network Size During Core Object Recognition},
  journal    = {Neural Computation},
  volume     = {34},
  number     = {8},
  pages      = {1652--1675},
  year       = {2022},
  url        = {https://doi.org/10.1162/neco\_a\_01506},
  doi        = {10.1162/NECO\_A\_01506},
  timestamp  = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/neco/NayebiSBKKGSDY22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, PLOS Computational Biology 18(9), 2022.
% pages holds the article's e-locator (the journal has no page ranges); it matches the number in the DOI suffix.
@article{DBLP:journals/ploscb/StockHOG22,
  author     = {Christopher H. Stock and Sarah E. Harvey and Samuel A. Ocko and Surya Ganguli},
  title      = {Synaptic balancing: {A} biologically plausible local learning rule that provably increases neural network noise robustness without sacrificing task performance},
  journal    = {{PLOS} Computational Biology},
  volume     = {18},
  number     = {9},
  pages      = {e1010418},
  year       = {2022},
  url        = {https://doi.org/10.1371/journal.pcbi.1010418},
  doi        = {10.1371/JOURNAL.PCBI.1010418},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ploscb/StockHOG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, PLOS Computational Biology 18(10), 2022.
% pages holds the article's e-locator (the journal has no page ranges); it matches the number in the DOI suffix.
@article{DBLP:journals/ploscb/TimcheckKBG22,
  author     = {Jonathan Timcheck and Jonathan Kadmon and Kwabena Boahen and Surya Ganguli},
  title      = {Optimal noise level for coding with tightly balanced networks of spiking neurons in the presence of transmission delays},
  journal    = {{PLOS} Computational Biology},
  volume     = {18},
  number     = {10},
  pages      = {e1010593},
  year       = {2022},
  url        = {https://doi.org/10.1371/journal.pcbi.1010593},
  doi        = {10.1371/JOURNAL.PCBI.1010593},
  timestamp  = {Wed, 17 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ploscb/TimcheckKBG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2203-11931.
% {MetaMorph:} is braced so sentence-casing styles do not flatten the camelCase name.
@inproceedings{DBLP:conf/iclr/GuptaFG022,
  author     = {Agrim Gupta and Linxi Fan and Surya Ganguli and Li Fei{-}Fei},
  title      = {{MetaMorph:} Learning Universal Controllers with Transformers},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=Opmqtk\_GvYL},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/GuptaFG022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2107-05802.
@inproceedings{DBLP:conf/iclr/LarsenFBG22,
  author     = {Brett W. Larsen and Stanislav Fort and Nic Becker and Surya Ganguli},
  title      = {How many degrees of freedom do we need to train deep networks: a loss landscape perspective},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=ChMLTGRjFcU},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LarsenFBG22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2206-01278.
% Editors are stored with full given names so the bibliography style decides how to abbreviate them.
@inproceedings{DBLP:conf/nips/PaulLGFD22,
  author     = {Mansheej Paul and Brett W. Larsen and Surya Ganguli and Jonathan Frankle and Gintare Karolina Dziugaite},
  editor     = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title      = {Lottery Tickets on a Data Diet: Finding Initializations with Sparse Trainable Networks},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/77dd8e90fe833eba5fae86cf017d7a56-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/PaulLGFD22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 conference paper. Same title as the arXiv entry DBLP:journals/corr/abs-2206-14486.
% The last author is spelled as in that arXiv entry; editors are stored with full given names.
@inproceedings{DBLP:conf/nips/SorscherGSGM22,
  author     = {Ben Sorscher and Robert Geirhos and Shashank Shekhar and Surya Ganguli and Ari S. Morcos},
  editor     = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title      = {Beyond neural scaling laws: beating power law scaling via data pruning},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/7b75da9b61eda40fa35453ee5d077df6-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/SorscherGSGM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.11931 (CoRR), 2022. Same title and authors as the ICLR entry DBLP:conf/iclr/GuptaFG022.
% {MetaMorph:} is braced so sentence-casing styles do not flatten the camelCase name.
@article{DBLP:journals/corr/abs-2203-11931,
  author     = {Agrim Gupta and Linxi Fan and Surya Ganguli and Li Fei{-}Fei},
  title      = {{MetaMorph:} Learning Universal Controllers with Transformers},
  journal    = {CoRR},
  volume     = {abs/2203.11931},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.11931},
  doi        = {10.48550/ARXIV.2203.11931},
  eprinttype = {arXiv},
  eprint     = {2203.11931},
  timestamp  = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-11931.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.01278 (CoRR), 2022. Same title and authors as the NeurIPS entry DBLP:conf/nips/PaulLGFD22.
@article{DBLP:journals/corr/abs-2206-01278,
  author     = {Mansheej Paul and Brett W. Larsen and Surya Ganguli and Jonathan Frankle and Gintare Karolina Dziugaite},
  title      = {Lottery Tickets on a Data Diet: Finding Initializations with Sparse Trainable Networks},
  journal    = {CoRR},
  volume     = {abs/2206.01278},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.01278},
  doi        = {10.48550/ARXIV.2206.01278},
  eprinttype = {arXiv},
  eprint     = {2206.01278},
  timestamp  = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-01278.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.14486 (CoRR), 2022. Same title as the NeurIPS entry DBLP:conf/nips/SorscherGSGM22.
@article{DBLP:journals/corr/abs-2206-14486,
  author     = {Ben Sorscher and Robert Geirhos and Shashank Shekhar and Surya Ganguli and Ari S. Morcos},
  title      = {Beyond neural scaling laws: beating power law scaling via data pruning},
  journal    = {CoRR},
  volume     = {abs/2206.14486},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.14486},
  doi        = {10.48550/ARXIV.2206.14486},
  eprinttype = {arXiv},
  eprint     = {2206.14486},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-14486.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.01768 (CoRR), 2022. The ICLR entry DBLP:conf/iclr/WhittingtonDGB23 has a near-identical title.
@article{DBLP:journals/corr/abs-2210-01768,
  author     = {James C. R. Whittington and Will Dorrell and Surya Ganguli and Timothy Edward John Behrens},
  title      = {Disentangling with Biological Constraints: {A} Theory of Functional Cell Types},
  journal    = {CoRR},
  volume     = {abs/2210.01768},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.01768},
  doi        = {10.48550/ARXIV.2210.01768},
  eprinttype = {arXiv},
  eprint     = {2210.01768},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-01768.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.03044 (CoRR), 2022. Same title and authors as the ICLR entry DBLP:conf/iclr/PaulCLFGD23.
@article{DBLP:journals/corr/abs-2210-03044,
  author     = {Mansheej Paul and Feng Chen and Brett W. Larsen and Jonathan Frankle and Surya Ganguli and Gintare Karolina Dziugaite},
  title      = {Unmasking the Lottery Ticket Hypothesis: What's Encoded in a Winning Ticket's Mask?},
  journal    = {CoRR},
  volume     = {abs/2210.03044},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.03044},
  doi        = {10.48550/ARXIV.2210.03044},
  eprinttype = {arXiv},
  eprint     = {2210.03044},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-03044.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.03820 (CoRR), 2022. Same title and authors as the ICLR entry DBLP:conf/iclr/KuninYMG23.
@article{DBLP:journals/corr/abs-2210-03820,
  author     = {Daniel Kunin and Atsushi Yamamura and Chao Ma and Surya Ganguli},
  title      = {The Asymmetric Maximum Margin Bias of Quasi-Homogeneous Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2210.03820},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.03820},
  doi        = {10.48550/ARXIV.2210.03820},
  eprinttype = {arXiv},
  eprint     = {2210.03820},
  timestamp  = {Wed, 12 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-03820.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.05546 (CoRR), 2022.
@article{DBLP:journals/corr/abs-2210-05546,
  author     = {Stanislav Fort and Ekin Dogus Cubuk and Surya Ganguli and Samuel S. Schoenholz},
  title      = {What does a deep neural network confidently perceive? The effective dimension of high certainty class manifolds and their low confidence boundaries},
  journal    = {CoRR},
  volume     = {abs/2210.05546},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.05546},
  doi        = {10.48550/ARXIV.2210.05546},
  eprinttype = {arXiv},
  eprint     = {2210.05546},
  timestamp  = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-05546.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.08340 (CoRR), 2022.
% {NeuroAI} is braced so sentence-casing styles keep its capitals; "James J. DiCarlo" is spelled as in DBLP:journals/neco/NayebiSBKKGSDY22.
@article{DBLP:journals/corr/abs-2210-08340,
  author     = {Anthony Zador and Blake A. Richards and Bence {\"{O}}lveczky and Sean Escola and Yoshua Bengio and Kwabena Boahen and Matthew M. Botvinick and Dmitri B. Chklovskii and Anne Churchland and Claudia Clopath and James J. DiCarlo and Surya Ganguli and Jeff Hawkins and Konrad P. K{\"{o}}rding and Alexei A. Koulakov and Yann LeCun and Timothy P. Lillicrap and Adam H. Marblestone and Bruno A. Olshausen and Alexandre Pouget and Cristina Savin and Terrence J. Sejnowski and Eero P. Simoncelli and Sara A. Solla and David Sussillo and Andreas S. Tolias and Doris Tsao},
  title      = {Toward Next-Generation Artificial Intelligence: Catalyzing the {NeuroAI} Revolution},
  journal    = {CoRR},
  volume     = {abs/2210.08340},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.08340},
  doi        = {10.48550/ARXIV.2210.08340},
  eprinttype = {arXiv},
  eprint     = {2210.08340},
  timestamp  = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-08340.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.09110 (CoRR), 2022. Same title and author list as the journal entry DBLP:journals/tmlr/LiangBLTSYZNWKN23.
@article{DBLP:journals/corr/abs-2211-09110,
  author     = {Percy Liang and Rishi Bommasani and Tony Lee and Dimitris Tsipras and Dilara Soylu and Michihiro Yasunaga and Yian Zhang and Deepak Narayanan and Yuhuai Wu and Ananya Kumar and Benjamin Newman and Binhang Yuan and Bobby Yan and Ce Zhang and Christian Cosgrove and Christopher D. Manning and Christopher R{\'{e}} and Diana Acosta{-}Navas and Drew A. Hudson and Eric Zelikman and Esin Durmus and Faisal Ladhak and Frieda Rong and Hongyu Ren and Huaxiu Yao and Jue Wang and Keshav Santhanam and Laurel J. Orr and Lucia Zheng and Mert Y{\"{u}}ksekg{\"{o}}n{\"{u}}l and Mirac Suzgun and Nathan Kim and Neel Guha and Niladri S. Chatterji and Omar Khattab and Peter Henderson and Qian Huang and Ryan Chi and Sang Michael Xie and Shibani Santurkar and Surya Ganguli and Tatsunori Hashimoto and Thomas Icard and Tianyi Zhang and Vishrav Chaudhary and William Wang and Xuechen Li and Yifan Mai and Yuhui Zhang and Yuta Koreeda},
  title      = {Holistic Evaluation of Language Models},
  journal    = {CoRR},
  volume     = {abs/2211.09110},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.09110},
  doi        = {10.48550/ARXIV.2211.09110},
  eprinttype = {arXiv},
  eprint     = {2211.09110},
  timestamp  = {Thu, 08 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-09110.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 conference paper.
@inproceedings{DBLP:conf/iclr/KuninSGYT21,
  author     = {Daniel Kunin and Javier Sagastuy{-}Bre{\~{n}}a and Surya Ganguli and Daniel L. K. Yamins and Hidenori Tanaka},
  title      = {Neural Mechanics: Symmetry and Broken Conservation Laws in Deep Learning Dynamics},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=q8qLAbQBupm},
  timestamp  = {Thu, 21 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KuninSGYT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 conference paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/MelG21,
  author     = {Gabriel Mel and Surya Ganguli},
  editor     = {Marina Meila and Tong Zhang},
  title      = {A theory of high dimensional regression with arbitrary correlations between input features and target functions: sample complexity, multiple descent curves and a hierarchy of phase transitions},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {7578--7587},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/mel21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/MelG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 conference paper (PMLR volume 139). Same authors as the arXiv entry DBLP:journals/corr/abs-2102-06810; the titles differ only in capitalisation.
@inproceedings{DBLP:conf/icml/TianCG21,
  author     = {Yuandong Tian and Xinlei Chen and Surya Ganguli},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Understanding self-supervised learning dynamics without contrastive pairs},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {10268--10278},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/tian21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/TianCG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 conference paper.
@inproceedings{DBLP:conf/nips/NayebiACHLMMSWG21,
  author     = {Aran Nayebi and Alexander Attinger and Malcolm Campbell and Kiah Hardcastle and Isabel Low and Caitlin S. Mallory and Gabriel Mel and Ben Sorscher and Alex H. Williams and Surya Ganguli and Lisa M. Giocomo and Daniel L. K. Yamins},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Explaining heterogeneity in medial entorhinal cortex with task-driven neural networks},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {12167--12179},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/656f0dbf9392657eed7feefc486781fb-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/NayebiACHLMMSWG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 conference paper. Same title and authors as the arXiv entry DBLP:journals/corr/abs-2107-07075.
@inproceedings{DBLP:conf/nips/PaulGD21,
  author     = {Mansheej Paul and Surya Ganguli and Gintare Karolina Dziugaite},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Deep Learning on a Data Diet: Finding Important Examples Early in Training},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {20596--20607},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/ac56f8fe9eea3e4a365f29f0f1957c55-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/PaulGD21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.02202 (CoRR), 2021.
% doi follows the arXiv DOI scheme (10.48550/arXiv.<id>) used by the newer arXiv entries in this file.
@article{DBLP:journals/corr/abs-2102-02202,
  author     = {Agrim Gupta and Silvio Savarese and Surya Ganguli and Li Fei{-}Fei},
  title      = {Embodied Intelligence via Learning and Evolution},
  journal    = {CoRR},
  volume     = {abs/2102.02202},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.02202},
  doi        = {10.48550/ARXIV.2102.02202},
  eprinttype = {arXiv},
  eprint     = {2102.02202},
  timestamp  = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-02202.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.06810 (CoRR), 2021. Same authors as the ICML entry DBLP:conf/icml/TianCG21; the titles differ only in capitalisation.
% doi follows the arXiv DOI scheme (10.48550/arXiv.<id>) used by the newer arXiv entries in this file.
@article{DBLP:journals/corr/abs-2102-06810,
  author     = {Yuandong Tian and Xinlei Chen and Surya Ganguli},
  title      = {Understanding self-supervised Learning Dynamics without Contrastive Pairs},
  journal    = {CoRR},
  volume     = {abs/2102.06810},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.06810},
  doi        = {10.48550/ARXIV.2102.06810},
  eprinttype = {arXiv},
  eprint     = {2102.06810},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-06810.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2107.05802 (CoRR), 2021. Same title and authors as the ICLR entry DBLP:conf/iclr/LarsenFBG22.
% doi follows the arXiv DOI scheme (10.48550/arXiv.<id>) used by the newer arXiv entries in this file.
@article{DBLP:journals/corr/abs-2107-05802,
  author     = {Brett W. Larsen and Stanislav Fort and Nic Becker and Surya Ganguli},
  title      = {How many degrees of freedom do we need to train deep networks: a loss landscape perspective},
  journal    = {CoRR},
  volume     = {abs/2107.05802},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.05802},
  doi        = {10.48550/ARXIV.2107.05802},
  eprinttype = {arXiv},
  eprint     = {2107.05802},
  timestamp  = {Tue, 20 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-05802.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2107.07075 (CoRR), 2021. Same title and authors as the NeurIPS entry DBLP:conf/nips/PaulGD21.
% doi follows the arXiv DOI scheme (10.48550/arXiv.<id>) used by the newer arXiv entries in this file.
@article{DBLP:journals/corr/abs-2107-07075,
  author     = {Mansheej Paul and Surya Ganguli and Gintare Karolina Dziugaite},
  title      = {Deep Learning on a Data Diet: Finding Important Examples Early in Training},
  journal    = {CoRR},
  volume     = {abs/2107.07075},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.07075},
  doi        = {10.48550/ARXIV.2107.07075},
  eprinttype = {arXiv},
  eprint     = {2107.07075},
  timestamp  = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-07075.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2107.09133 (CoRR), 2021. Same author list as the journal entry DBLP:journals/neco/KuninSGMTGY24 (titles differ slightly; presumably its preprint).
% doi follows the arXiv DOI scheme (10.48550/arXiv.<id>) used by the newer arXiv entries in this file.
@article{DBLP:journals/corr/abs-2107-09133,
  author     = {Daniel Kunin and Javier Sagastuy{-}Bre{\~{n}}a and Lauren Gillespie and Eshed Margalit and Hidenori Tanaka and Surya Ganguli and Daniel L. K. Yamins},
  title      = {Rethinking the limiting dynamics of {SGD:} modified loss, phase space oscillations, and anomalous diffusion},
  journal    = {CoRR},
  volume     = {abs/2107.09133},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.09133},
  doi        = {10.48550/ARXIV.2107.09133},
  eprinttype = {arXiv},
  eprint     = {2107.09133},
  timestamp  = {Thu, 29 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-09133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Nature 580(7801), 2020.
@article{DBLP:journals/nature/RumyantsevLHZSC20,
  author     = {Oleg I. Rumyantsev and J{\'{e}}r{\^{o}}me A. Lecoq and Oscar Hernandez and Yanping Zhang and Joan Savall and Radoslaw Chrapkiewicz and Jane Li and Hongkui Zeng and Surya Ganguli and Mark J. Schnitzer},
  title      = {Fundamental bounds on the fidelity of sensory cortical coding},
  journal    = {Nature},
  volume     = {580},
  number     = {7801},
  pages      = {100--105},
  year       = {2020},
  url        = {https://doi.org/10.1038/s41586-020-2130-2},
  doi        = {10.1038/S41586-020-2130-2},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/nature/RumyantsevLHZSC20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 conference paper.
% {RNNs} is braced so sentence-casing styles keep the acronym's capitals.
@inproceedings{DBLP:conf/emnlp/HewittHGLM20,
  author     = {John Hewitt and Michael Hahn and Surya Ganguli and Percy Liang and Christopher D. Manning},
  editor     = {Bonnie Webber and Trevor Cohn and Yulan He and Yang Liu},
  title      = {{RNNs} can generate bounded hierarchical languages with optimal memory},
  booktitle  = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages      = {1978--2010},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.156},
  doi        = {10.18653/V1/2020.EMNLP-MAIN.156},
  timestamp  = {Tue, 20 Aug 2024 07:54:43 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/HewittHGLM20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR volume 119). Same title as the arXiv entry DBLP:journals/corr/abs-2003-01513.
% The last author is spelled "Daniel L. K. Yamins" as in that arXiv entry and the other records in this file.
@inproceedings{DBLP:conf/icml/KuninNSGBY20,
  author     = {Daniel Kunin and Aran Nayebi and Javier Sagastuy{-}Bre{\~{n}}a and Surya Ganguli and Jonathan M. Bloom and Daniel L. K. Yamins},
  title      = {Two Routes to Scalable Credit Assignment without Weight Symmetry},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {5511--5521},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/kunin20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/KuninNSGBY20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper.
@inproceedings{DBLP:conf/nips/FortDPK0G20,
  author     = {Stanislav Fort and Gintare Karolina Dziugaite and Mansheej Paul and Sepideh Kharaghani and Daniel M. Roy and Surya Ganguli},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Deep learning versus kernel learning: an empirical study of loss landscape geometry and the time evolution of the Neural Tangent Kernel},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/405075699f065e43581f27d67bb68478-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/FortDPK0G20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper.
@inproceedings{DBLP:conf/nips/KadmonTG20,
  author     = {Jonathan Kadmon and Jonathan Timcheck and Surya Ganguli},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Predictive coding in balanced neural networks with noise, chaos and delays},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/c236337b043acf93c7df397fdb9082b3-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/KadmonTG20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper.
@inproceedings{DBLP:conf/nips/NayebiSGY20,
  author     = {Aran Nayebi and Sanjana Srivastava and Surya Ganguli and Daniel L. K. Yamins},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Identifying Learning Rules From Neural Network Observables},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/1ba922ac006a8e5f2b123684c2f4d65f-Abstract.html},
  timestamp  = {Thu, 21 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/NayebiSGY20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; the arXiv record DBLP:journals/corr/abs-2006-05467 has the same title and authors.
@inproceedings{DBLP:conf/nips/TanakaKYG20,
  author    = {Hidenori Tanaka and Daniel Kunin and Daniel L. K. Yamins and Surya Ganguli},
  editor    = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title     = {Pruning neural networks without any data by iteratively conserving synaptic flow},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/46a4378f835dc8040c8057beb6a2da52-Abstract.html},
  timestamp = {Thu, 21 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/TanakaKYG20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.01513, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2003-01513,
  author     = {Daniel Kunin and Aran Nayebi and Javier Sagastuy{-}Bre{\~{n}}a and Surya Ganguli and Jonathan M. Bloom and Daniel L. K. Yamins},
  title      = {Two Routes to Scalable Credit Assignment without Weight Symmetry},
  journal    = {CoRR},
  volume     = {abs/2003.01513},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.01513},
  eprinttype = {arXiv},
  eprint     = {2003.01513},
  timestamp  = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-01513.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.05467; the NeurIPS 2020 record DBLP:conf/nips/TanakaKYG20 has the same title and authors.
@article{DBLP:journals/corr/abs-2006-05467,
  author     = {Hidenori Tanaka and Daniel Kunin and Daniel L. K. Yamins and Surya Ganguli},
  title      = {Pruning neural networks without any data by iteratively conserving synaptic flow},
  journal    = {CoRR},
  volume     = {abs/2006.05467},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.05467},
  eprinttype = {arXiv},
  eprint     = {2006.05467},
  timestamp  = {Sat, 13 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-05467.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.00578, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2010-00578,
  author     = {Yuandong Tian and Lantao Yu and Xinlei Chen and Surya Ganguli},
  title      = {Understanding Self-supervised Learning with Dual Deep Networks},
  journal    = {CoRR},
  volume     = {abs/2010.00578},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.00578},
  eprinttype = {arXiv},
  eprint     = {2010.00578},
  timestamp  = {Mon, 12 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-00578.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.07515, listed by DBLP under CoRR.
% The acronym RNNs is braced so that styles which sentence-case titles do not turn it into "Rnns".
@article{DBLP:journals/corr/abs-2010-07515,
  author     = {John Hewitt and Michael Hahn and Surya Ganguli and Percy Liang and Christopher D. Manning},
  title      = {{RNNs} can generate bounded hierarchical languages with optimal memory},
  journal    = {CoRR},
  volume     = {abs/2010.07515},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.07515},
  eprinttype = {arXiv},
  eprint     = {2010.07515},
  timestamp  = {Wed, 21 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-07515.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.11765; the NeurIPS 2020 record DBLP:conf/nips/NayebiSGY20 has the same title and authors.
@article{DBLP:journals/corr/abs-2010-11765,
  author     = {Aran Nayebi and Sanjana Srivastava and Surya Ganguli and Daniel L. K. Yamins},
  title      = {Identifying Learning Rules From Neural Network Observables},
  journal    = {CoRR},
  volume     = {abs/2010.11765},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.11765},
  eprinttype = {arXiv},
  eprint     = {2010.11765},
  timestamp  = {Tue, 27 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-11765.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.15110; the NeurIPS 2020 record DBLP:conf/nips/FortDPK0G20 has the same title and authors.
@article{DBLP:journals/corr/abs-2010-15110,
  author     = {Stanislav Fort and Gintare Karolina Dziugaite and Mansheej Paul and Sepideh Kharaghani and Daniel M. Roy and Surya Ganguli},
  title      = {Deep learning versus kernel learning: an empirical study of loss landscape geometry and the time evolution of the Neural Tangent Kernel},
  journal    = {CoRR},
  volume     = {abs/2010.15110},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.15110},
  eprinttype = {arXiv},
  eprint     = {2010.15110},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-15110.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2012.04728, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-2012-04728,
  author     = {Daniel Kunin and Javier Sagastuy{-}Bre{\~{n}}a and Surya Ganguli and Daniel L. K. Yamins and Hidenori Tanaka},
  title      = {Neural Mechanics: Symmetry and Broken Conservation Laws in Deep Learning Dynamics},
  journal    = {CoRR},
  volume     = {abs/2012.04728},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.04728},
  eprinttype = {arXiv},
  eprint     = {2012.04728},
  timestamp  = {Sat, 02 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-04728.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 paper; the arXiv record DBLP:journals/corr/abs-1809-10374 has the same title and authors.
@inproceedings{DBLP:conf/iclr/LampinenG19,
  author    = {Andrew K. Lampinen and Surya Ganguli},
  title     = {An analytic theory of generalization dynamics and transfer learning in deep linear networks},
  booktitle = {7th International Conference on Learning Representations, {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher = {OpenReview.net},
  year      = {2019},
  url       = {https://openreview.net/forum?id=ryfMLoCqtQ},
  timestamp = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/LampinenG19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 paper; the arXiv record DBLP:journals/corr/abs-1901-00945 has the same authors and title wording.
% The acronym CNNs is braced so that styles which sentence-case titles keep its capitals.
@inproceedings{DBLP:conf/iclr/LindseyOGD19,
  author    = {Jack Lindsey and Samuel A. Ocko and Surya Ganguli and St{\'{e}}phane Deny},
  title     = {A Unified Theory of Early Visual Representations from Retina to Cortex through Anatomically Constrained Deep {CNNs}},
  booktitle = {7th International Conference on Learning Representations, {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher = {OpenReview.net},
  year      = {2019},
  url       = {https://openreview.net/forum?id=S1xq3oR5tQ},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/LindseyOGD19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper; the arXiv record DBLP:journals/corr/abs-1912-06207 has the same title.
@inproceedings{DBLP:conf/nips/TanakaNMMBG19,
  author    = {Hidenori Tanaka and Aran Nayebi and Niru Maheswaranathan and Lane McIntosh and Stephen Baccus and Surya Ganguli},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {From deep learning to mechanistic understanding in neuroscience: the structure of retinal prediction},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {8535--8545},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/eeaebbffb5d29ff62799637fc51adb7b-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/TanakaNMMBG19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper, pages 10003--10013.
@inproceedings{DBLP:conf/nips/SorscherMGO19,
  author    = {Ben Sorscher and Gabriel Mel and Surya Ganguli and Samuel A. Ocko},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {A unified theory for the origin of grid cells through the lens of pattern formation},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {10003--10013},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/6e7d5d259be7bf56ed79029c4e621f44-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/SorscherMGO19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper; the arXiv record DBLP:journals/corr/abs-1907-08549 has the same title and authors.
@inproceedings{DBLP:conf/nips/Maheswaranathan19,
  author    = {Niru Maheswaranathan and Alex H. Williams and Matthew D. Golub and Surya Ganguli and David Sussillo},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {Universality and individuality in neural dynamics across large populations of recurrent networks},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {15603--15615},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/5f5d472067f77b5c88f69f1bcfda1e08-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/Maheswaranathan19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper; the arXiv record DBLP:journals/corr/abs-1906-10720 has the same title and authors.
@inproceedings{DBLP:conf/nips/Maheswaranathan19a,
  author    = {Niru Maheswaranathan and Alex H. Williams and Matthew D. Golub and Surya Ganguli and David Sussillo},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {Reverse engineering recurrent networks for sentiment classification reveals line attractor dynamics},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {15670--15679},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/d921c3c762b1522c475ac8fc0811bb0f-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/Maheswaranathan19a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1901.00945; the ICLR 2019 record DBLP:conf/iclr/LindseyOGD19 has the same authors and title wording.
% The acronym CNNs is braced so that styles which sentence-case titles keep its capitals.
@article{DBLP:journals/corr/abs-1901-00945,
  author     = {Jack Lindsey and Samuel A. Ocko and Surya Ganguli and St{\'{e}}phane Deny},
  title      = {A Unified Theory of Early Visual Representations from Retina to Cortex through Anatomically Constrained Deep {CNNs}},
  journal    = {CoRR},
  volume     = {abs/1901.00945},
  year       = {2019},
  url        = {http://arxiv.org/abs/1901.00945},
  eprinttype = {arXiv},
  eprint     = {1901.00945},
  timestamp  = {Sun, 03 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-00945.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.10720; the NeurIPS 2019 record DBLP:conf/nips/Maheswaranathan19a has the same title and authors.
@article{DBLP:journals/corr/abs-1906-10720,
  author     = {Niru Maheswaranathan and Alex H. Williams and Matthew D. Golub and Surya Ganguli and David Sussillo},
  title      = {Reverse engineering recurrent networks for sentiment classification reveals line attractor dynamics},
  journal    = {CoRR},
  volume     = {abs/1906.10720},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.10720},
  eprinttype = {arXiv},
  eprint     = {1906.10720},
  timestamp  = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-10720.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.00139, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-1907-00139,
  author     = {Anthony Degleris and Ben Antin and Surya Ganguli and Alex H. Williams},
  title      = {Fast Convolutive Nonnegative Matrix Factorization Through Coordinate and Block Coordinate Updates},
  journal    = {CoRR},
  volume     = {abs/1907.00139},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.00139},
  eprinttype = {arXiv},
  eprint     = {1907.00139},
  timestamp  = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-00139.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.08549; the NeurIPS 2019 record DBLP:conf/nips/Maheswaranathan19 has the same title and authors.
@article{DBLP:journals/corr/abs-1907-08549,
  author     = {Niru Maheswaranathan and Alex H. Williams and Matthew D. Golub and Surya Ganguli and David Sussillo},
  title      = {Universality and individuality in neural dynamics across large populations of recurrent networks},
  journal    = {CoRR},
  volume     = {abs/1907.08549},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.08549},
  eprinttype = {arXiv},
  eprint     = {1907.08549},
  timestamp  = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-08549.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1910.05929, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-1910-05929,
  author     = {Stanislav Fort and Surya Ganguli},
  title      = {Emergent properties of the local geometry of neural loss landscapes},
  journal    = {CoRR},
  volume     = {abs/1910.05929},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.05929},
  eprinttype = {arXiv},
  eprint     = {1910.05929},
  timestamp  = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-05929.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1912.06207; the NeurIPS 2019 record DBLP:conf/nips/TanakaNMMBG19 has the same title.
@article{DBLP:journals/corr/abs-1912-06207,
  author     = {Hidenori Tanaka and Aran Nayebi and Niru Maheswaranathan and Lane McIntosh and Stephen A. Baccus and Surya Ganguli},
  title      = {From deep learning to mechanistic understanding in neuroscience: the structure of retinal prediction},
  journal    = {CoRR},
  volume     = {abs/1912.06207},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.06207},
  eprinttype = {arXiv},
  eprint     = {1912.06207},
  timestamp  = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-06207.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Neural Computation 30(6), 2018; the DBLP record carries no page range.
% The camel-case name SuperSpike is braced so that styles which sentence-case titles do not turn it into "Superspike".
@article{DBLP:journals/neco/ZenkeG18,
  author    = {Friedemann Zenke and Surya Ganguli},
  title     = {{SuperSpike}: Supervised Learning in Multilayer Spiking Neural Networks},
  journal   = {Neural Comput.},
  volume    = {30},
  number    = {6},
  year      = {2018},
  url       = {https://doi.org/10.1162/neco\_a\_01086},
  doi       = {10.1162/NECO\_A\_01086},
  timestamp = {Tue, 07 May 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/neco/ZenkeG18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% PLoS Comput. Biol. 14(8), 2018; the DBLP record carries no page range.
@article{DBLP:journals/ploscb/Maheswaranathan18,
  author    = {Niru Maheswaranathan and David B. Kastner and Stephen A. Baccus and Surya Ganguli},
  title     = {Inferring hidden structure in multilayered neural circuits},
  journal   = {PLoS Comput. Biol.},
  volume    = {14},
  number    = {8},
  year      = {2018},
  url       = {https://doi.org/10.1371/journal.pcbi.1006291},
  doi       = {10.1371/JOURNAL.PCBI.1006291},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ploscb/Maheswaranathan18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2018 paper (PMLR volume 84); the arXiv record DBLP:journals/corr/abs-1802-09979 has the same authors and title wording.
@inproceedings{DBLP:conf/aistats/PenningtonSG18,
  author    = {Jeffrey Pennington and Samuel S. Schoenholz and Surya Ganguli},
  editor    = {Amos J. Storkey and Fernando P{\'{e}}rez{-}Cruz},
  title     = {The emergence of spectral universality in deep networks},
  booktitle = {International Conference on Artificial Intelligence and Statistics, {AISTATS} 2018, 9-11 April 2018, Playa Blanca, Lanzarote, Canary Islands, Spain},
  series    = {Proceedings of Machine Learning Research},
  volume    = {84},
  pages     = {1924--1932},
  publisher = {{PMLR}},
  year      = {2018},
  url       = {http://proceedings.mlr.press/v84/pennington18a.html},
  timestamp = {Wed, 03 Apr 2019 18:17:22 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/PenningtonSG18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 paper; the arXiv record DBLP:journals/corr/abs-1807-00053 has the same title and authors.
@inproceedings{DBLP:conf/nips/NayebiBKKGSDY18,
  author    = {Aran Nayebi and Daniel Bear and Jonas Kubilius and Kohitij Kar and Surya Ganguli and David Sussillo and James J. DiCarlo and Daniel L. K. Yamins},
  editor    = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title     = {Task-Driven Convolutional Recurrent Models of the Visual System},
  booktitle = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages     = {5295--5306},
  year      = {2018},
  url       = {https://proceedings.neurips.cc/paper/2018/hash/6be93f7a96fed60c477d30ae1de032fd-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/NayebiBKKGSDY18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 paper; the arXiv record DBLP:journals/corr/abs-1810-10065 has the same title and authors.
@inproceedings{DBLP:conf/nips/KadmonG18,
  author    = {Jonathan Kadmon and Surya Ganguli},
  editor    = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title     = {Statistical mechanics of low-rank tensor decomposition},
  booktitle = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages     = {8212--8222},
  year      = {2018},
  url       = {https://proceedings.neurips.cc/paper/2018/hash/b3848d61bbbc6207c6668a8a9e2730ed-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/KadmonG18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 paper, pages 9411--9422.
@inproceedings{DBLP:conf/nips/OckoLGD18,
  author    = {Samuel A. Ocko and Jack Lindsey and Surya Ganguli and St{\'{e}}phane Deny},
  editor    = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title     = {The emergence of multiple retinal cell types through efficient coding of natural movies},
  booktitle = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages     = {9411--9422},
  year      = {2018},
  url       = {https://proceedings.neurips.cc/paper/2018/hash/d94fd74dcde1aa553be72c1006578b23-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/OckoLGD18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1802.09979; the AISTATS 2018 record DBLP:conf/aistats/PenningtonSG18 has the same authors and title wording.
@article{DBLP:journals/corr/abs-1802-09979,
  author     = {Jeffrey Pennington and Samuel S. Schoenholz and Surya Ganguli},
  title      = {The Emergence of Spectral Universality in Deep Networks},
  journal    = {CoRR},
  volume     = {abs/1802.09979},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.09979},
  eprinttype = {arXiv},
  eprint     = {1802.09979},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-09979.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1807.00053; the NeurIPS 2018 record DBLP:conf/nips/NayebiBKKGSDY18 has the same title and authors.
@article{DBLP:journals/corr/abs-1807-00053,
  author     = {Aran Nayebi and Daniel Bear and Jonas Kubilius and Kohitij Kar and Surya Ganguli and David Sussillo and James J. DiCarlo and Daniel L. K. Yamins},
  title      = {Task-Driven Convolutional Recurrent Models of the Visual System},
  journal    = {CoRR},
  volume     = {abs/1807.00053},
  year       = {2018},
  url        = {http://arxiv.org/abs/1807.00053},
  eprinttype = {arXiv},
  eprint     = {1807.00053},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-00053.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1809.10374; the ICLR 2019 record DBLP:conf/iclr/LampinenG19 has the same title and authors.
@article{DBLP:journals/corr/abs-1809-10374,
  author     = {Andrew K. Lampinen and Surya Ganguli},
  title      = {An analytic theory of generalization dynamics and transfer learning in deep linear networks},
  journal    = {CoRR},
  volume     = {abs/1809.10374},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.10374},
  eprinttype = {arXiv},
  eprint     = {1809.10374},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-10374.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1810.10065; the NeurIPS 2018 record DBLP:conf/nips/KadmonG18 has the same title and authors.
@article{DBLP:journals/corr/abs-1810-10065,
  author     = {Jonathan Kadmon and Surya Ganguli},
  title      = {Statistical mechanics of low-rank tensor decomposition},
  journal    = {CoRR},
  volume     = {abs/1810.10065},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.10065},
  eprinttype = {arXiv},
  eprint     = {1810.10065},
  timestamp  = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-10065.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1810.10531, listed by DBLP under CoRR.
@article{DBLP:journals/corr/abs-1810-10531,
  author     = {Andrew M. Saxe and James L. McClelland and Surya Ganguli},
  title      = {A mathematical theory of semantic development in deep neural networks},
  journal    = {CoRR},
  volume     = {abs/1810.10531},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.10531},
  eprinttype = {arXiv},
  eprint     = {1810.10531},
  timestamp  = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-10531.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% J. Open Source Softw. 2(9), 2017.
% The language name Python is braced so that styles which sentence-case titles do not lowercase it.
@article{DBLP:journals/jossw/NaeckerMGB17,
  author    = {Benjamin Naecker and Niru Maheswaranathan and Surya Ganguli and Stephen Baccus},
  title     = {Pyret: {A} {Python} package for analysis of neurophysiology data},
  journal   = {J. Open Source Softw.},
  volume    = {2},
  number    = {9},
  pages     = {137},
  year      = {2017},
  url       = {https://doi.org/10.21105/joss.00137},
  doi       = {10.21105/JOSS.00137},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jossw/NaeckerMGB17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 workshop-track paper.
@inproceedings{DBLP:conf/iclr/PooleZG17,
  author    = {Ben Poole and Friedemann Zenke and Surya Ganguli},
  title     = {Intelligent synapses for multi-task and transfer learning},
  booktitle = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year      = {2017},
  url       = {https://openreview.net/forum?id=rJzabxSFg},
  timestamp = {Thu, 04 Apr 2019 13:20:08 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/PooleZG17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper; the arXiv record DBLP:journals/corr/SchoenholzGGS16 has the same title and authors.
@inproceedings{DBLP:conf/iclr/SchoenholzGGS17,
  author    = {Samuel S. Schoenholz and Justin Gilmer and Surya Ganguli and Jascha Sohl{-}Dickstein},
  title     = {Deep Information Propagation},
  booktitle = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher = {OpenReview.net},
  year      = {2017},
  url       = {https://openreview.net/forum?id=H1W1UN9gg},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/SchoenholzGGS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper (PMLR volume 70); the arXiv record DBLP:journals/corr/RaghuPKGS16 has the same authors and title wording.
@inproceedings{DBLP:conf/icml/RaghuPKGS17,
  author    = {Maithra Raghu and Ben Poole and Jon M. Kleinberg and Surya Ganguli and Jascha Sohl{-}Dickstein},
  editor    = {Doina Precup and Yee Whye Teh},
  title     = {On the Expressive Power of Deep Neural Networks},
  booktitle = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series    = {Proceedings of Machine Learning Research},
  volume    = {70},
  pages     = {2847--2854},
  publisher = {{PMLR}},
  year      = {2017},
  url       = {http://proceedings.mlr.press/v70/raghu17a.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/RaghuPKGS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper (PMLR volume 70), pages 3987--3995.
@inproceedings{DBLP:conf/icml/ZenkePG17,
  author    = {Friedemann Zenke and Ben Poole and Surya Ganguli},
  editor    = {Doina Precup and Yee Whye Teh},
  title     = {Continual Learning Through Synaptic Intelligence},
  booktitle = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series    = {Proceedings of Machine Learning Research},
  volume    = {70},
  pages     = {3987--3995},
  publisher = {{PMLR}},
  year      = {2017},
  url       = {http://proceedings.mlr.press/v70/zenke17a.html},
  timestamp = {Tue, 07 May 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/ZenkePG17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2017 paper; the arXiv record DBLP:journals/corr/abs-1711-02282 has the same title and authors.
@inproceedings{DBLP:conf/nips/GoyalKGB17,
  author    = {Anirudh Goyal and Nan Rosemary Ke and Surya Ganguli and Yoshua Bengio},
  editor    = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title     = {Variational Walkback: Learning a Transition Operator as a Stochastic Recurrent Net},
  booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages     = {4392--4402},
  year      = {2017},
  url       = {https://proceedings.neurips.cc/paper/2017/hash/46a558d97954d0692411c861cf78ef79-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/GoyalKGB17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2017 paper; the arXiv record DBLP:journals/corr/abs-1711-04735 has the same title and authors.
@inproceedings{DBLP:conf/nips/PenningtonSG17,
  author    = {Jeffrey Pennington and Samuel S. Schoenholz and Surya Ganguli},
  editor    = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title     = {Resurrecting the sigmoid in deep learning through dynamical isometry: theory and practice},
  booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages     = {4785--4795},
  year      = {2017},
  url       = {https://proceedings.neurips.cc/paper/2017/hash/d9fc0cdb67638d50f411432d0d41d0ba-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/PenningtonSG17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1703.04200, listed by DBLP under CoRR.
@article{DBLP:journals/corr/ZenkePG17,
  author     = {Friedemann Zenke and Ben Poole and Surya Ganguli},
  title      = {Improved multitask learning through synaptic intelligence},
  journal    = {CoRR},
  volume     = {abs/1703.04200},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.04200},
  eprinttype = {arXiv},
  eprint     = {1703.04200},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ZenkePG17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1703.09202, listed by DBLP under CoRR.
@article{DBLP:journals/corr/NayebiG17,
  author     = {Aran Nayebi and Surya Ganguli},
  title      = {Biologically inspired protection of deep networks from adversarial attacks},
  journal    = {CoRR},
  volume     = {abs/1703.09202},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.09202},
  eprinttype = {arXiv},
  eprint     = {1703.09202},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/NayebiG17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1705.11146, listed by DBLP under CoRR.
% The camel-case name SuperSpike is braced so that styles which sentence-case titles do not turn it into "Superspike".
@article{DBLP:journals/corr/ZenkeG17,
  author     = {Friedemann Zenke and Surya Ganguli},
  title      = {{SuperSpike}: Supervised learning in multi-layer spiking neural networks},
  journal    = {CoRR},
  volume     = {abs/1705.11146},
  year       = {2017},
  url        = {http://arxiv.org/abs/1705.11146},
  eprinttype = {arXiv},
  eprint     = {1705.11146},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ZenkeG17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.02282; the NIPS 2017 record DBLP:conf/nips/GoyalKGB17 has the same title and authors.
@article{DBLP:journals/corr/abs-1711-02282,
  author     = {Anirudh Goyal and Nan Rosemary Ke and Surya Ganguli and Yoshua Bengio},
  title      = {Variational Walkback: Learning a Transition Operator as a Stochastic Recurrent Net},
  journal    = {CoRR},
  volume     = {abs/1711.02282},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.02282},
  eprinttype = {arXiv},
  eprint     = {1711.02282},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-02282.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1711.04735; the NIPS 2017 record DBLP:conf/nips/PenningtonSG17 has the same title and authors.
@article{DBLP:journals/corr/abs-1711-04735,
  author     = {Jeffrey Pennington and Samuel S. Schoenholz and Surya Ganguli},
  title      = {Resurrecting the sigmoid in deep learning through dynamical isometry: theory and practice},
  journal    = {CoRR},
  volume     = {abs/1711.04735},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.04735},
  eprinttype = {arXiv},
  eprint     = {1711.04735},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-04735.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2016 paper, pages 1361--1369.
@inproceedings{DBLP:conf/nips/McIntoshMNGB16,
  author    = {Lane McIntosh and Niru Maheswaranathan and Aran Nayebi and Surya Ganguli and Stephen Baccus},
  editor    = {Daniel D. Lee and Masashi Sugiyama and Ulrike von Luxburg and Isabelle Guyon and Roman Garnett},
  title     = {Deep Learning Models of the Retinal Response to Natural Scenes},
  booktitle = {Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, December 5-10, 2016, Barcelona, Spain},
  pages     = {1361--1369},
  year      = {2016},
  url       = {https://proceedings.neurips.cc/paper/2016/hash/a1d33d0dfec820b41b54430b50e96b5c-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/McIntoshMNGB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2016 paper; the arXiv record DBLP:journals/corr/PooleLRSG16 has the same title and authors.
@inproceedings{DBLP:conf/nips/PooleLRSG16,
  author    = {Ben Poole and Subhaneil Lahiri and Maithra Raghu and Jascha Sohl{-}Dickstein and Surya Ganguli},
  editor    = {Daniel D. Lee and Masashi Sugiyama and Ulrike von Luxburg and Isabelle Guyon and Roman Garnett},
  title     = {Exponential expressivity in deep neural networks through transient chaos},
  booktitle = {Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, December 5-10, 2016, Barcelona, Spain},
  pages     = {3360--3368},
  year      = {2016},
  url       = {https://proceedings.neurips.cc/paper/2016/hash/148510031349642de5ca0c544f31b2ef-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/PooleLRSG16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2016 paper, pages 3378--3386.
% "Bayes" (a proper noun) and "M-estimation" (capital M) are braced so that styles which sentence-case titles keep their capitals.
@inproceedings{DBLP:conf/nips/AdvaniG16,
  author    = {Madhu Advani and Surya Ganguli},
  editor    = {Daniel D. Lee and Masashi Sugiyama and Ulrike von Luxburg and Isabelle Guyon and Roman Garnett},
  title     = {An equivalence between high dimensional {Bayes} optimal inference and {M-estimation}},
  booktitle = {Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, December 5-10, 2016, Barcelona, Spain},
  pages     = {3378--3386},
  year      = {2016},
  url       = {https://proceedings.neurips.cc/paper/2016/hash/08e6bea8e90ba87af3c9554d94db6579-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/AdvaniG16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1603.07758, listed by DBLP under CoRR.
@article{DBLP:journals/corr/LahiriSG16,
  author     = {Subhaneil Lahiri and Jascha Sohl{-}Dickstein and Surya Ganguli},
  title      = {A universal tradeoff between power, precision and speed in physical communication},
  journal    = {CoRR},
  volume     = {abs/1603.07758},
  year       = {2016},
  url        = {http://arxiv.org/abs/1603.07758},
  eprinttype = {arXiv},
  eprint     = {1603.07758},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/LahiriSG16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1606.05336; the ICML 2017 record DBLP:conf/icml/RaghuPKGS17 has the same authors and title wording.
@article{DBLP:journals/corr/RaghuPKGS16,
  author     = {Maithra Raghu and Ben Poole and Jon M. Kleinberg and Surya Ganguli and Jascha Sohl{-}Dickstein},
  title      = {On the expressive power of deep neural networks},
  journal    = {CoRR},
  volume     = {abs/1606.05336},
  year       = {2016},
  url        = {http://arxiv.org/abs/1606.05336},
  eprinttype = {arXiv},
  eprint     = {1606.05336},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RaghuPKGS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1606.05340; the NIPS 2016 record DBLP:conf/nips/PooleLRSG16 has the same title and authors.
@article{DBLP:journals/corr/PooleLRSG16,
  author     = {Ben Poole and Subhaneil Lahiri and Maithra Raghu and Jascha Sohl{-}Dickstein and Surya Ganguli},
  title      = {Exponential expressivity in deep neural networks through transient chaos},
  journal    = {CoRR},
  volume     = {abs/1606.05340},
  year       = {2016},
  url        = {http://arxiv.org/abs/1606.05340},
  eprinttype = {arXiv},
  eprint     = {1606.05340},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/PooleLRSG16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1607.04331, listed by DBLP under CoRR.
@article{DBLP:journals/corr/LahiriGG16,
  author     = {Subhaneil Lahiri and Peiran Gao and Surya Ganguli},
  title      = {Random projections of random manifolds},
  journal    = {CoRR},
  volume     = {abs/1607.04331},
  year       = {2016},
  url        = {http://arxiv.org/abs/1607.04331},
  eprinttype = {arXiv},
  eprint     = {1607.04331},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/LahiriGG16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, listed under CoRR as abs/1611.01232.
@article{DBLP:journals/corr/SchoenholzGGS16,
  author     = {Samuel S. Schoenholz and Justin Gilmer and Surya Ganguli and Jascha Sohl{-}Dickstein},
  title      = {Deep Information Propagation},
  journal    = {CoRR},
  volume     = {abs/1611.01232},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.01232},
  eprinttype = {arXiv},
  eprint     = {1611.01232},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SchoenholzGGS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1611.08083.
@article{DBLP:journals/corr/RaghuPKGS16a,
  author     = {Maithra Raghu and Ben Poole and Jon M. Kleinberg and Surya Ganguli and Jascha Sohl{-}Dickstein},
  title      = {Survey of Expressivity in Deep Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1611.08083},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.08083},
  eprinttype = {arXiv},
  eprint     = {1611.08083},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RaghuPKGS16a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article; the pages field holds the single value 92.
% "Hebbian" and "Markov" derive from proper names, so they are braced to
% keep their capitals under styles that sentence-case titles.
@article{DBLP:journals/ficn/BouchardGB15,
  author    = {Kristofer E. Bouchard and Surya Ganguli and Michael S. Brainard},
  title     = {Role of the site of synaptic competition and the balance of learning forces for {Hebbian} encoding of probabilistic {Markov} sequences},
  journal   = {Frontiers Comput. Neurosci.},
  volume    = {9},
  pages     = {92},
  year      = {2015},
  url       = {https://doi.org/10.3389/fncom.2015.00092},
  doi       = {10.3389/FNCOM.2015.00092},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ficn/BouchardGB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2015 conference paper (JMLR Workshop and Conference Proceedings, volume 37).
@inproceedings{DBLP:conf/icml/Sohl-DicksteinW15,
  author    = {Jascha Sohl{-}Dickstein and Eric A. Weiss and Niru Maheswaranathan and Surya Ganguli},
  editor    = {Francis R. Bach and David M. Blei},
  title     = {Deep Unsupervised Learning using Nonequilibrium Thermodynamics},
  booktitle = {Proceedings of the 32nd International Conference on Machine Learning, {ICML} 2015, Lille, France, 6-11 July 2015},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {37},
  pages     = {2256--2265},
  publisher = {JMLR.org},
  year      = {2015},
  url       = {http://proceedings.mlr.press/v37/sohl-dickstein15.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Sohl-DicksteinW15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper in Advances in Neural Information Processing Systems 28 (2015).
@inproceedings{DBLP:conf/nips/PiechBHGSGS15,
  author    = {Chris Piech and Jonathan Bassen and Jonathan Huang and Surya Ganguli and Mehran Sahami and Leonidas J. Guibas and Jascha Sohl{-}Dickstein},
  editor    = {Corinna Cortes and Neil D. Lawrence and Daniel D. Lee and Masashi Sugiyama and Roman Garnett},
  title     = {Deep Knowledge Tracing},
  booktitle = {Advances in Neural Information Processing Systems 28: Annual Conference on Neural Information Processing Systems 2015, December 7-12, 2015, Montreal, Quebec, Canada},
  pages     = {505--513},
  year      = {2015},
  url       = {https://proceedings.neurips.cc/paper/2015/hash/bac9162b47c56fc8a4d2a519803d51b3-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/PiechBHGSGS15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1503.03585.
@article{DBLP:journals/corr/Sohl-DicksteinW15,
  author     = {Jascha Sohl{-}Dickstein and Eric A. Weiss and Niru Maheswaranathan and Surya Ganguli},
  title      = {Deep Unsupervised Learning using Nonequilibrium Thermodynamics},
  journal    = {CoRR},
  volume     = {abs/1503.03585},
  year       = {2015},
  url        = {http://arxiv.org/abs/1503.03585},
  eprinttype = {arXiv},
  eprint     = {1503.03585},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/Sohl-DicksteinW15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1506.05908.
@article{DBLP:journals/corr/PiechSHGSGS15,
  author     = {Chris Piech and Jonathan Spencer and Jonathan Huang and Surya Ganguli and Mehran Sahami and Leonidas J. Guibas and Jascha Sohl{-}Dickstein},
  title      = {Deep Knowledge Tracing},
  journal    = {CoRR},
  volume     = {abs/1506.05908},
  year       = {2015},
  url        = {http://arxiv.org/abs/1506.05908},
  eprinttype = {arXiv},
  eprint     = {1506.05908},
  timestamp  = {Tue, 25 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PiechSHGSGS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2014 conference paper (JMLR Workshop and Conference Proceedings, volume 32).
% "Newton" is braced so that sentence-casing styles keep the proper name
% capitalised; the booktitle uses the ordinal "31st".
@inproceedings{DBLP:conf/icml/Sohl-DicksteinPG14,
  author    = {Jascha Sohl{-}Dickstein and Ben Poole and Surya Ganguli},
  title     = {Fast large-scale optimization by unifying stochastic gradient and quasi-{Newton} methods},
  booktitle = {Proceedings of the 31st International Conference on Machine Learning, {ICML} 2014, Beijing, China, 21-26 June 2014},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {32},
  pages     = {604--612},
  publisher = {JMLR.org},
  year      = {2014},
  url       = {http://proceedings.mlr.press/v32/sohl-dicksteinb14.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Sohl-DicksteinPG14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper in Advances in Neural Information Processing Systems 27 (2014).
% The fourth author is spelled "Kyunghyun Cho", matching the CoRR entry for
% the same title in this file, so both records name the author identically.
@inproceedings{DBLP:conf/nips/DauphinPGCGB14,
  author    = {Yann N. Dauphin and Razvan Pascanu and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Kyunghyun Cho and Surya Ganguli and Yoshua Bengio},
  editor    = {Zoubin Ghahramani and Max Welling and Corinna Cortes and Neil D. Lawrence and Kilian Q. Weinberger},
  title     = {Identifying and attacking the saddle point problem in high-dimensional non-convex optimization},
  booktitle = {Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems 2014, December 8-13 2014, Montreal, Quebec, Canada},
  pages     = {2933--2941},
  year      = {2014},
  url       = {https://proceedings.neurips.cc/paper/2014/hash/17e23e50bedc63b4095e3d8204ce063b-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/DauphinPGCGB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2014 conference-track paper whose only locator is an arXiv URL.
% The eprinttype/eprint pair repeats the identifier from that URL in
% structured form, as the other arXiv-hosted entries in this file do.
@inproceedings{DBLP:journals/corr/SaxeMG13,
  author     = {Andrew M. Saxe and James L. McClelland and Surya Ganguli},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {Exact solutions to the nonlinear dynamics of learning in deep linear neural networks},
  booktitle  = {2nd International Conference on Learning Representations, {ICLR} 2014, Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year       = {2014},
  url        = {http://arxiv.org/abs/1312.6120},
  eprinttype = {arXiv},
  eprint     = {1312.6120},
  timestamp  = {Thu, 04 Apr 2019 13:20:07 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SaxeMG13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1405.4604.
@article{DBLP:journals/corr/PascanuDGB14,
  author     = {Razvan Pascanu and Yann N. Dauphin and Surya Ganguli and Yoshua Bengio},
  title      = {On the saddle point problem for non-convex optimization},
  journal    = {CoRR},
  volume     = {abs/1405.4604},
  year       = {2014},
  url        = {http://arxiv.org/abs/1405.4604},
  eprinttype = {arXiv},
  eprint     = {1405.4604},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PascanuDGB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1406.1831.
@article{DBLP:journals/corr/PooleSG14,
  author     = {Ben Poole and Jascha Sohl{-}Dickstein and Surya Ganguli},
  title      = {Analyzing noise in autoencoders and deep networks},
  journal    = {CoRR},
  volume     = {abs/1406.1831},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.1831},
  eprinttype = {arXiv},
  eprint     = {1406.1831},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PooleSG14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1406.2572.
@article{DBLP:journals/corr/DauphinPGCGB14,
  author     = {Yann N. Dauphin and Razvan Pascanu and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Kyunghyun Cho and Surya Ganguli and Yoshua Bengio},
  title      = {Identifying and attacking the saddle point problem in high-dimensional non-convex optimization},
  journal    = {CoRR},
  volume     = {abs/1406.2572},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.2572},
  eprinttype = {arXiv},
  eprint     = {1406.2572},
  timestamp  = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DauphinPGCGB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CogSci 2013 conference paper; the record carries no page range.
% The mixed-case acronym in the booktitle is braced so its capitalisation
% survives any style that recases that field.
@inproceedings{DBLP:conf/cogsci/SaxeMG13,
  author    = {Andrew M. Saxe and James L. McClelland and Surya Ganguli},
  editor    = {Markus Knauff and Michael Pauen and Natalie Sebanz and Ipke Wachsmuth},
  title     = {Learning hierarchical categories in deep neural networks},
  booktitle = {Proceedings of the 35th Annual Meeting of the Cognitive Science Society, {CogSci} 2013, Berlin, Germany, July 31 - August 3, 2013},
  publisher = {cognitivesciencesociety.org},
  year      = {2013},
  url       = {https://escholarship.org/uc/item/2fv5q3hn},
  timestamp = {Tue, 30 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/cogsci/SaxeMG13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% EMBC 2013 conference paper, published by IEEE, with a DOI.
@inproceedings{DBLP:conf/embc/KaoNSRGS13,
  author    = {Jonathan C. Kao and Paul Nuyujukian and Sergey D. Stavisky and Stephen I. Ryu and Surya Ganguli and Krishna V. Shenoy},
  title     = {Investigating the role of firing-rate normalization and dimensionality reduction in brain-machine interface robustness},
  booktitle = {35th Annual International Conference of the {IEEE} Engineering in Medicine and Biology Society, {EMBC} 2013, Osaka, Japan, July 3-7, 2013},
  pages     = {293--298},
  publisher = {{IEEE}},
  year      = {2013},
  url       = {https://doi.org/10.1109/EMBC.2013.6609495},
  doi       = {10.1109/EMBC.2013.6609495},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/embc/KaoNSRGS13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper in Advances in Neural Information Processing Systems 26 (2013).
@inproceedings{DBLP:conf/nips/LahiriG13,
  author    = {Subhaneil Lahiri and Surya Ganguli},
  editor    = {Christopher J. C. Burges and L{\'{e}}on Bottou and Zoubin Ghahramani and Kilian Q. Weinberger},
  title     = {A memory frontier for complex synapses},
  booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages     = {1034--1042},
  year      = {2013},
  url       = {https://proceedings.neurips.cc/paper/2013/hash/7f24d240521d99071c93af3917215ef7-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/LahiriG13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint, listed under CoRR as abs/1311.2115.
% "Newton" is braced so that sentence-casing styles keep the proper name
% capitalised.
@article{DBLP:journals/corr/Sohl-DicksteinPG13,
  author     = {Jascha Sohl{-}Dickstein and Ben Poole and Surya Ganguli},
  title      = {An adaptive low dimensional quasi-{Newton} sum of functions optimizer},
  journal    = {CoRR},
  volume     = {abs/1311.2115},
  year       = {2013},
  url        = {http://arxiv.org/abs/1311.2115},
  eprinttype = {arXiv},
  eprint     = {1311.2115},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/Sohl-DicksteinPG13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper in Advances in Neural Information Processing Systems 23 (2010).
@inproceedings{DBLP:conf/nips/GanguliS10,
  author    = {Surya Ganguli and Haim Sompolinsky},
  editor    = {John D. Lafferty and Christopher K. I. Williams and John Shawe{-}Taylor and Richard S. Zemel and Aron Culotta},
  title     = {Short-term memory in neuronal networks through dynamical compressed sensing},
  booktitle = {Advances in Neural Information Processing Systems 23: 24th Annual Conference on Neural Information Processing Systems 2010. Proceedings of a meeting held 6-9 December 2010, Vancouver, British Columbia, Canada},
  pages     = {667--675},
  publisher = {Curran Associates, Inc.},
  year      = {2010},
  url       = {https://proceedings.neurips.cc/paper/2010/hash/0f2c9a93eea6f38fabb3acb1c31488c6-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/GanguliS10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.