RAEE: A Training-Free Retrieval-Augmented Early Exiting Framework for Efficient Inference. Huang, L., Wu, S., Cui, Y., Xiong, Y., Liu, X., Kuo, T., Guan, N., & Xue, C. J. CoRR, 2024. Paper doi bibtex @article{DBLP:journals/corr/abs-2405-15198,
author = {Lianming Huang and
Shangyu Wu and
Yufei Cui and
Ying Xiong and
Xue Liu and
Tei{-}Wei Kuo and
Nan Guan and
Chun Jason Xue},
title = {{RAEE:} {A} Training-Free Retrieval-Augmented Early Exiting Framework
for Efficient Inference},
journal = {CoRR},
volume = {abs/2405.15198},
year = {2024},
url = {https://doi.org/10.48550/arXiv.2405.15198},
doi = {10.48550/ARXIV.2405.15198},
eprinttype = {arXiv},
eprint = {2405.15198},
timestamp = {Wed, 19 Jun 2024 01:00:00 +0200},
biburl = {https://dblp.org/rec/journals/corr/abs-2405-15198.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"SwwP5GcSowHnnwTsW","bibbaseid":"huang-wu-cui-xiong-liu-kuo-guan-xue-raeeatrainingfreeretrievalaugmentedearlyexitingframeworkforefficientinference-2024","author_short":["Huang, L.","Wu, S.","Cui, Y.","Xiong, Y.","Liu, X.","Kuo, T.","Guan, N.","Xue, C. J."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Lianming"],"propositions":[],"lastnames":["Huang"],"suffixes":[]},{"firstnames":["Shangyu"],"propositions":[],"lastnames":["Wu"],"suffixes":[]},{"firstnames":["Yufei"],"propositions":[],"lastnames":["Cui"],"suffixes":[]},{"firstnames":["Ying"],"propositions":[],"lastnames":["Xiong"],"suffixes":[]},{"firstnames":["Xue"],"propositions":[],"lastnames":["Liu"],"suffixes":[]},{"firstnames":["Tei-Wei"],"propositions":[],"lastnames":["Kuo"],"suffixes":[]},{"firstnames":["Nan"],"propositions":[],"lastnames":["Guan"],"suffixes":[]},{"firstnames":["Chun","Jason"],"propositions":[],"lastnames":["Xue"],"suffixes":[]}],"title":"RAEE: A Training-Free Retrieval-Augmented Early Exiting Framework for Efficient Inference","journal":"CoRR","volume":"abs/2405.15198","year":"2024","url":"https://doi.org/10.48550/arXiv.2405.15198","doi":"10.48550/ARXIV.2405.15198","eprinttype":"arXiv","eprint":"2405.15198","timestamp":"Wed, 19 Jun 2024 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-2405-15198.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2405-15198,\n author = {Lianming Huang and\n Shangyu Wu and\n Yufei Cui and\n Ying Xiong and\n Xue Liu and\n Tei{-}Wei Kuo and\n Nan Guan and\n Chun Jason Xue},\n title = {{RAEE:} {A} Training-Free Retrieval-Augmented Early Exiting Framework\n for Efficient Inference},\n journal = {CoRR},\n volume = {abs/2405.15198},\n year = {2024},\n url = {https://doi.org/10.48550/arXiv.2405.15198},\n doi = {10.48550/ARXIV.2405.15198},\n eprinttype = {arXiv},\n eprint = {2405.15198},\n timestamp = {Wed, 19 Jun 2024 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-2405-15198.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Huang, L.","Wu, S.","Cui, Y.","Xiong, Y.","Liu, X.","Kuo, T.","Guan, N.","Xue, C. J."],"key":"DBLP:journals/corr/abs-2405-15198","id":"DBLP:journals/corr/abs-2405-15198","bibbaseid":"huang-wu-cui-xiong-liu-kuo-guan-xue-raeeatrainingfreeretrievalaugmentedearlyexitingframeworkforefficientinference-2024","role":"author","urls":{"paper":"https://doi.org/10.48550/arXiv.2405.15198"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/x/ChunJasonXue.bib","dataSources":["Zmgr4hiaLbNyiBeRm"],"keywords":[],"search_terms":["raee","training","free","retrieval","augmented","early","exiting","framework","efficient","inference","huang","wu","cui","xiong","liu","kuo","guan","xue"],"title":"RAEE: A Training-Free Retrieval-Augmented Early Exiting Framework for Efficient Inference","year":2024}