Towards Cross-Tokenizer Distillation: the Universal Logit Distillation Loss for LLMs. Boizard, N., Haddad, K. E., Hudelot, C., & Colombo, P. CoRR, 2024.
Paper doi bibtex @article{DBLP:journals/corr/abs-2402-12030,
author = {Nicolas Boizard and
Kevin El Haddad and
C{\'{e}}line Hudelot and
Pierre Colombo},
title = {Towards Cross-Tokenizer Distillation: the Universal Logit Distillation
Loss for LLMs},
journal = {CoRR},
volume = {abs/2402.12030},
year = {2024},
url = {https://doi.org/10.48550/arXiv.2402.12030},
doi = {10.48550/ARXIV.2402.12030},
eprinttype = {arXiv},
eprint = {2402.12030},
timestamp = {Thu, 21 Mar 2024 00:00:00 +0100},
biburl = {https://dblp.org/rec/journals/corr/abs-2402-12030.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"2B4KsuK3pRRYn5MbB","bibbaseid":"boizard-haddad-hudelot-colombo-towardscrosstokenizerdistillationtheuniversallogitdistillationlossforllms-2024","author_short":["Boizard, N.","Haddad, K. E.","Hudelot, C.","Colombo, P."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Nicolas"],"propositions":[],"lastnames":["Boizard"],"suffixes":[]},{"firstnames":["Kevin","El"],"propositions":[],"lastnames":["Haddad"],"suffixes":[]},{"firstnames":["Céline"],"propositions":[],"lastnames":["Hudelot"],"suffixes":[]},{"firstnames":["Pierre"],"propositions":[],"lastnames":["Colombo"],"suffixes":[]}],"title":"Towards Cross-Tokenizer Distillation: the Universal Logit Distillation Loss for LLMs","journal":"CoRR","volume":"abs/2402.12030","year":"2024","url":"https://doi.org/10.48550/arXiv.2402.12030","doi":"10.48550/ARXIV.2402.12030","eprinttype":"arXiv","eprint":"2402.12030","timestamp":"Thu, 21 Mar 2024 00:00:00 +0100","biburl":"https://dblp.org/rec/journals/corr/abs-2402-12030.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2402-12030,\n author = {Nicolas Boizard and\n Kevin El Haddad and\n C{\\'{e}}line Hudelot and\n Pierre Colombo},\n title = {Towards Cross-Tokenizer Distillation: the Universal Logit Distillation\n Loss for LLMs},\n journal = {CoRR},\n volume = {abs/2402.12030},\n year = {2024},\n url = {https://doi.org/10.48550/arXiv.2402.12030},\n doi = {10.48550/ARXIV.2402.12030},\n eprinttype = {arXiv},\n eprint = {2402.12030},\n timestamp = {Thu, 21 Mar 2024 00:00:00 +0100},\n biburl = {https://dblp.org/rec/journals/corr/abs-2402-12030.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Boizard, N.","Haddad, K. E.","Hudelot, C.","Colombo, P."],"key":"DBLP:journals/corr/abs-2402-12030","id":"DBLP:journals/corr/abs-2402-12030","bibbaseid":"boizard-haddad-hudelot-colombo-towardscrosstokenizerdistillationtheuniversallogitdistillationlossforllms-2024","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2402.12030"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/229/3167.bib","dataSources":["GXv5EbWSzjLH96rpE","FD6yNzHMPC2zrsvYD"],"keywords":[],"search_terms":["towards","cross","tokenizer","distillation","universal","logit","distillation","loss","llms","boizard","haddad","hudelot","colombo"],"title":"Towards Cross-Tokenizer Distillation: the Universal Logit Distillation Loss for LLMs","year":2024}