BibTeX record conf/nsdi/ZuGDT0HBKRDLWWL24

download as .bib file

% Conference paper from the NSDI 2024 proceedings (record exported from dblp).
% Braced words in title/booktitle are case-protected so that sentence-casing
% bibliography styles do not lowercase proper nouns and acronyms.
@inproceedings{DBLP:conf/nsdi/ZuGDT0HBKRDLWWL24,
  author       = {Yazhou Zu and
                  Alireza Ghaffarkhah and
                  Hoang{-}Vu Dang and
                  Brian Towles and
                  Steven Hand and
                  Safeen Huda and
                  Adekunle Bello and
                  Alexander Kolbasov and
                  Arash Rezaei and
                  Dayou Du and
                  Steve Lacy and
                  Hang Wang and
                  Aaron Wisner and
                  Chris Lewis and
                  Henri Bahini},
  editor       = {Laurent Vanbever and
                  Irene Zhang},
  title        = {Resiliency at Scale: Managing {Google's} {TPUv4} Machine Learning Supercomputer},
  booktitle    = {21st {USENIX} Symposium on Networked Systems Design and Implementation,
                  {NSDI} 2024, Santa Clara, CA, April 15-17, 2024},
  pages        = {761--774},
  publisher    = {{USENIX} Association},
  year         = {2024},
  url          = {https://www.usenix.org/conference/nsdi24/presentation/zu},
  timestamp    = {Fri, 19 Apr 2024 16:22:18 +0200},
  biburl       = {https://dblp.org/rec/conf/nsdi/ZuGDT0HBKRDLWWL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics