BibTeX record journals/corr/abs-2110-03888

download as .bib file

@comment{arXiv eprint 2110.03888, record exported from dblp (see biburl).}
@article{DBLP:journals/corr/abs-2110-03888,
  author     = {Lin, Junyang and Yang, An and Bai, Jinze and Zhou, Chang and
                Jiang, Le and Jia, Xianyan and Wang, Ang and Zhang, Jie and
                Li, Yong and Lin, Wei and Zhou, Jingren and Yang, Hongxia},
  title      = {{M6-10T:} {A} Sharing-Delinking Paradigm for Efficient
                Multi-Trillion Parameter Pretraining},
  journal    = {CoRR},
  volume     = {abs/2110.03888},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.03888},
  eprinttype = {arXiv},
  eprint     = {2110.03888},
  timestamp  = {Mon, 22 Jul 2024 08:24:23 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-03888.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics