No Buffer, No Bottleneck: Efficient Zero-Copy KV Cache Offloading for Long-Context LLMs. Luo, S. & Shen, H. In The 20th USENIX Symposium on Operating Systems Design and Implementation (OSDI), Seattle, WA, July, 2026.
bibtex   
@comment{Conference paper record. Only acronyms are brace-protected in the title and booktitle, so a bibliography style remains free to apply its own casing to the other words. The first author's given name is recorded as an initial only; expand it once the full name is confirmed.}
@inproceedings{luo_no_2026,
	author = {Luo, S. and Shen, Haiying},
	title = {No Buffer, No Bottleneck: Efficient Zero-Copy {KV} Cache Offloading for Long-Context {LLMs}},
	booktitle = {The 20th {USENIX} Symposium on Operating Systems Design and Implementation ({OSDI})},
	address = {Seattle, WA},
	month = jul,
	year = {2026},
	keywords = {Foundational, SYS: CosmicAI Contact Author, WG: Explorable},
}

Downloads: 0