BibTeX record journals/corr/abs-2401-08383

download as .bib file

% arXiv preprint (CoRR) record as exported by dblp; author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2401-08383,
  author     = {Yao, Jinghan and Anthony, Quentin and Shafi, Aamir and
                Subramoni, Hari and Panda, Dhabaleswar K.},
  title      = {Exploiting Inter-Layer Expert Affinity for Accelerating Mixture-of-Experts Model Inference},
  journal    = {CoRR},
  volume     = {abs/2401.08383},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2401.08383},
  doi        = {10.48550/ARXIV.2401.08383},
  url        = {https://doi.org/10.48550/arXiv.2401.08383},
  timestamp  = {Thu, 01 Feb 2024 15:35:36 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-08383.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics