{"_id":"9FiyWW7WoqGzJX36G","bibbaseid":"pope-douglas-chowdhery-devlin-bradbury-heek-xiao-agrawal-etal-efficientlyscalingtransformerinference-2023","author_short":["Pope, R.","Douglas, S.","Chowdhery, A.","Devlin, J.","Bradbury, J.","Heek, J.","Xiao, K.","Agrawal, S.","Dean, J."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Reiner"],"propositions":[],"lastnames":["Pope"],"suffixes":[]},{"firstnames":["Sholto"],"propositions":[],"lastnames":["Douglas"],"suffixes":[]},{"firstnames":["Aakanksha"],"propositions":[],"lastnames":["Chowdhery"],"suffixes":[]},{"firstnames":["Jacob"],"propositions":[],"lastnames":["Devlin"],"suffixes":[]},{"firstnames":["James"],"propositions":[],"lastnames":["Bradbury"],"suffixes":[]},{"firstnames":["Jonathan"],"propositions":[],"lastnames":["Heek"],"suffixes":[]},{"firstnames":["Kefan"],"propositions":[],"lastnames":["Xiao"],"suffixes":[]},{"firstnames":["Shivani"],"propositions":[],"lastnames":["Agrawal"],"suffixes":[]},{"firstnames":["Jeff"],"propositions":[],"lastnames":["Dean"],"suffixes":[]}],"title":"Efficiently Scaling Transformer Inference","booktitle":"Proceedings of the Sixth Conference on Machine Learning and Systems, MLSys 2023, Miami, FL, USA, June 4-8, 2023","year":"2023","crossref":"DBLP:conf/mlsys/2023","url":"https://proceedings.mlsys.org/paper\\_files/paper/2023/hash/c4be71ab8d24cdfb45e3d06dbfca2780-Abstract-mlsys2023.html","timestamp":"Fri, 28 Jun 2024 10:41:31 +0200","biburl":"https://dblp.org/rec/conf/mlsys/PopeDCDBHXAD23.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@inproceedings{DBLP:conf/mlsys/PopeDCDBHXAD23,\n author = {Reiner Pope and\n Sholto Douglas and\n Aakanksha Chowdhery and\n Jacob Devlin and\n James Bradbury and\n Jonathan Heek and\n Kefan Xiao and\n Shivani Agrawal and\n Jeff Dean},\n title = {Efficiently Scaling Transformer Inference},\n booktitle = {Proceedings of the Sixth Conference on Machine Learning and Systems,\n MLSys 2023, Miami, FL, USA, June 4-8, 2023},\n year = {2023},\n crossref = {DBLP:conf/mlsys/2023},\n url = {https://proceedings.mlsys.org/paper\\_files/paper/2023/hash/c4be71ab8d24cdfb45e3d06dbfca2780-Abstract-mlsys2023.html},\n timestamp = {Fri, 28 Jun 2024 10:41:31 +0200},\n biburl = {https://dblp.org/rec/conf/mlsys/PopeDCDBHXAD23.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Pope, R.","Douglas, S.","Chowdhery, A.","Devlin, J.","Bradbury, J.","Heek, J.","Xiao, K.","Agrawal, S.","Dean, J."],"key":"DBLP:conf/mlsys/PopeDCDBHXAD23","id":"DBLP:conf/mlsys/PopeDCDBHXAD23","bibbaseid":"pope-douglas-chowdhery-devlin-bradbury-heek-xiao-agrawal-etal-efficientlyscalingtransformerinference-2023","role":"author","urls":{"Paper":"https://proceedings.mlsys.org/paper\\_files/paper/2023/hash/c4be71ab8d24cdfb45e3d06dbfca2780-Abstract-mlsys2023.html"},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"http://dblp.org/pers/tb2/d/Dean:Jeffrey","dataSources":["rMEZSGRpGTSfEZaHM"],"keywords":[],"search_terms":["efficiently","scaling","transformer","inference","pope","douglas","chowdhery","devlin","bradbury","heek","xiao","agrawal","dean"],"title":"Efficiently Scaling Transformer Inference","year":2023}