Matryoshka Quantization. Nair, P. A., Datta, P., Dean, J., Jain, P., & Kusupati, A. CoRR, 2025.
Paper doi bibtex @article{DBLP:journals/corr/abs-2502-06786,
  author     = {Pranav Ajit Nair and
                Puranjay Datta and
                Jeff Dean and
                Prateek Jain and
                Aditya Kusupati},
  title      = {Matryoshka Quantization},
  journal    = {CoRR},
  volume     = {abs/2502.06786},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2502.06786},
  doi        = {10.48550/ARXIV.2502.06786},
  eprinttype = {arXiv},
  eprint     = {2502.06786},
  timestamp  = {Wed, 12 Mar 2025 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2502-06786.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
Downloads: 0
{"_id":"BEiAACnuYw2GYEb7m","bibbaseid":"nair-datta-dean-jain-kusupati-matryoshkaquantization-2025","author_short":["Nair, P. A.","Datta, P.","Dean, J.","Jain, P.","Kusupati, A."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Pranav","Ajit"],"propositions":[],"lastnames":["Nair"],"suffixes":[]},{"firstnames":["Puranjay"],"propositions":[],"lastnames":["Datta"],"suffixes":[]},{"firstnames":["Jeff"],"propositions":[],"lastnames":["Dean"],"suffixes":[]},{"firstnames":["Prateek"],"propositions":[],"lastnames":["Jain"],"suffixes":[]},{"firstnames":["Aditya"],"propositions":[],"lastnames":["Kusupati"],"suffixes":[]}],"title":"Matryoshka Quantization","journal":"CoRR","volume":"abs/2502.06786","year":"2025","url":"https://doi.org/10.48550/arXiv.2502.06786","doi":"10.48550/ARXIV.2502.06786","eprinttype":"arXiv","eprint":"2502.06786","timestamp":"Wed, 12 Mar 2025 00:00:00 +0100","biburl":"https://dblp.org/rec/journals/corr/abs-2502-06786.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2502-06786,\n author = {Pranav Ajit Nair and\n Puranjay Datta and\n Jeff Dean and\n Prateek Jain and\n Aditya Kusupati},\n title = {Matryoshka Quantization},\n journal = {CoRR},\n volume = {abs/2502.06786},\n year = {2025},\n url = {https://doi.org/10.48550/arXiv.2502.06786},\n doi = {10.48550/ARXIV.2502.06786},\n eprinttype = {arXiv},\n eprint = {2502.06786},\n timestamp = {Wed, 12 Mar 2025 00:00:00 +0100},\n biburl = {https://dblp.org/rec/journals/corr/abs-2502-06786.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Nair, P. 
A.","Datta, P.","Dean, J.","Jain, P.","Kusupati, A."],"key":"DBLP:journals/corr/abs-2502-06786","id":"DBLP:journals/corr/abs-2502-06786","bibbaseid":"nair-datta-dean-jain-kusupati-matryoshkaquantization-2025","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2502.06786"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://dblp.org/pers/tb2/d/Dean:Jeffrey","dataSources":["rMEZSGRpGTSfEZaHM"],"keywords":[],"search_terms":["matryoshka","quantization","nair","datta","dean","jain","kusupati"],"title":"Matryoshka Quantization","year":2025}