The Era of 1-bit LLMs: All Large Language Models are in 1.58 Bits

The Era of 1-bit LLMs: All Large Language Models are in 1.58 Bits. Ma, S., Wang, H., Ma, L., Wang, L., Wang, W., Huang, S., Dong, L., Wang, R., Xue, J., & Wei, F. CoRR, 2024.

Paper doi bibtex

@comment{arXiv preprint 2402.17764, record exported from dblp (see biburl and bibsource).
  The acronym in the title is brace-protected so that sentence-casing styles keep its capitals.
  Author names use the Last, First form so name parsing is unambiguous.}
@article{DBLP:journals/corr/abs-2402-17764,
  author       = {Ma, Shuming and
                  Wang, Hongyu and
                  Ma, Lingxiao and
                  Wang, Lei and
                  Wang, Wenhui and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Ruiping and
                  Xue, Jilong and
                  Wei, Furu},
  title        = {The Era of 1-bit {LLMs}: All Large Language Models are in 1.58 Bits},
  journal      = {CoRR},
  volume       = {abs/2402.17764},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.17764},
  doi          = {10.48550/ARXIV.2402.17764},
  eprinttype   = {arXiv},
  eprint       = {2402.17764},
  timestamp    = {Fri, 19 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-17764.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0

{"_id":"TamTt8wTGvz4podCF","bibbaseid":"ma-wang-ma-wang-wang-huang-dong-wang-etal-theeraof1bitllmsalllargelanguagemodelsarein158bits-2024","author_short":["Ma, S.","Wang, H.","Ma, L.","Wang, L.","Wang, W.","Huang, S.","Dong, L.","Wang, R.","Xue, J.","Wei, F."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Shuming"],"propositions":[],"lastnames":["Ma"],"suffixes":[]},{"firstnames":["Hongyu"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Lingxiao"],"propositions":[],"lastnames":["Ma"],"suffixes":[]},{"firstnames":["Lei"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Wenhui"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Shaohan"],"propositions":[],"lastnames":["Huang"],"suffixes":[]},{"firstnames":["Li"],"propositions":[],"lastnames":["Dong"],"suffixes":[]},{"firstnames":["Ruiping"],"propositions":[],"lastnames":["Wang"],"suffixes":[]},{"firstnames":["Jilong"],"propositions":[],"lastnames":["Xue"],"suffixes":[]},{"firstnames":["Furu"],"propositions":[],"lastnames":["Wei"],"suffixes":[]}],"title":"The Era of 1-bit LLMs: All Large Language Models are in 1.58 Bits","journal":"CoRR","volume":"abs/2402.17764","year":"2024","url":"https://doi.org/10.48550/arXiv.2402.17764","doi":"10.48550/ARXIV.2402.17764","eprinttype":"arXiv","eprint":"2402.17764","timestamp":"Fri, 19 Jul 2024 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-2402-17764.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2402-17764,\n author = {Shuming Ma and\n Hongyu Wang and\n Lingxiao Ma and\n Lei Wang and\n Wenhui Wang and\n Shaohan Huang and\n Li Dong and\n Ruiping Wang and\n Jilong Xue and\n Furu Wei},\n title = {The Era of 1-bit LLMs: All Large Language Models are in 1.58 Bits},\n journal = {CoRR},\n volume = {abs/2402.17764},\n year = {2024},\n url = {https://doi.org/10.48550/arXiv.2402.17764},\n doi = 
{10.48550/ARXIV.2402.17764},\n eprinttype = {arXiv},\n eprint = {2402.17764},\n timestamp = {Fri, 19 Jul 2024 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-2402-17764.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Ma, S.","Wang, H.","Ma, L.","Wang, L.","Wang, W.","Huang, S.","Dong, L.","Wang, R.","Xue, J.","Wei, F."],"key":"DBLP:journals/corr/abs-2402-17764","id":"DBLP:journals/corr/abs-2402-17764","bibbaseid":"ma-wang-ma-wang-wang-huang-dong-wang-etal-theeraof1bitllmsalllargelanguagemodelsarein158bits-2024","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2402.17764"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/176/0380.bib","dataSources":["zbFJei64gwybfvHiC"],"keywords":[],"search_terms":["era","bit","llms","large","language","models","bits","ma","wang","ma","wang","wang","huang","dong","wang","xue","wei"],"title":"The Era of 1-bit LLMs: All Large Language Models are in 1.58 Bits","year":2024}