Managing KV Cache for Coordinated Waiting and Execution Time in LLM Serving. Shen, H., Sen, T., & Tanaka, M. In The Proceedings of the 35th International Conference on Computer Communications and Networks (ICCCN 2026), Honolulu, Hawaii, USA, July, 2026.
bibtex   
% Conference paper: ICCCN 2026 (Honolulu, Hawaii, USA; July 2026).
% Only the acronyms in the title are brace-protected, so a bibliography
% style remains free to apply its own title casing to the other words.
% NOTE(review): the third author's given name is available only as an
% initial here -- replace "M." with the full given name once confirmed.
@inproceedings{shen_managing_2026,
	author = {Shen, Haiying and Sen, Tanmoy and Tanaka, M.},
	title = {Managing {KV} Cache for Coordinated Waiting and Execution Time in {LLM} Serving},
	booktitle = {The {Proceedings} of the 35th {International} {Conference} on {Computer} {Communications} and {Networks} ({ICCCN} 2026)},
	address = {Honolulu, Hawaii, USA},
	month = jul,
	year = {2026},
	keywords = {Foundational, SYS: CosmicAI Contact Author, WG: Explorable},
}

Downloads: 0