Efficiently Scaling Transformer Inference. Pope, R., Douglas, S., Chowdhery, A., Devlin, J., Bradbury, J., Heek, J., Xiao, K., Agrawal, S., & Dean, J. In Proceedings of the Sixth Conference on Machine Learning and Systems, MLSys 2023, Miami, FL, USA, June 4-8, 2023.
Efficiently Scaling Transformer Inference [link]Paper  bibtex   
% Conference paper record exported from dblp (see bibsource). The booktitle and
% year are stated inline in addition to the crossref to the proceedings record.
@inproceedings{DBLP:conf/mlsys/PopeDCDBHXAD23,
  author    = {Pope, Reiner and Douglas, Sholto and Chowdhery, Aakanksha and
               Devlin, Jacob and Bradbury, James and Heek, Jonathan and
               Xiao, Kefan and Agrawal, Shivani and Dean, Jeff},
  title     = {Efficiently Scaling Transformer Inference},
  booktitle = {Proceedings of the Sixth Conference on Machine Learning and Systems, MLSys 2023, Miami, FL, USA, June 4-8, 2023},
  year      = {2023},
  url       = {https://proceedings.mlsys.org/paper\_files/paper/2023/hash/c4be71ab8d24cdfb45e3d06dbfca2780-Abstract-mlsys2023.html},
  crossref  = {DBLP:conf/mlsys/2023},
  biburl    = {https://dblp.org/rec/conf/mlsys/PopeDCDBHXAD23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
  timestamp = {Fri, 28 Jun 2024 10:41:31 +0200}
}

Downloads: 0