PolyServe: Efficient Multi-SLO Serving at Scale. Zhu, K., Shi, H., Xu, L., Shan, J., Krishnamurthy, A., Kasikci, B., & Xie, L. CoRR, 2025.
Paper doi bibtex
@article{DBLP:journals/corr/abs-2507-17769,
author = {Kan Zhu and
Haiyang Shi and
Le Xu and
Jiaxin Shan and
Arvind Krishnamurthy and
Baris Kasikci and
Liguang Xie},
title = {PolyServe: Efficient Multi-SLO Serving at Scale},
journal = {CoRR},
volume = {abs/2507.17769},
year = {2025},
url = {https://doi.org/10.48550/arXiv.2507.17769},
doi = {10.48550/ARXIV.2507.17769},
eprinttype = {arXiv},
eprint = {2507.17769},
timestamp = {Mon, 18 Aug 2025 01:00:00 +0200},
biburl = {https://dblp.org/rec/journals/corr/abs-2507-17769.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"ojdZjQbF2Ar79Gkg3","bibbaseid":"zhu-shi-xu-shan-krishnamurthy-kasikci-xie-polyserveefficientmultisloservingatscale-2025","author_short":["Zhu, K.","Shi, H.","Xu, L.","Shan, J.","Krishnamurthy, A.","Kasikci, B.","Xie, L."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Kan"],"propositions":[],"lastnames":["Zhu"],"suffixes":[]},{"firstnames":["Haiyang"],"propositions":[],"lastnames":["Shi"],"suffixes":[]},{"firstnames":["Le"],"propositions":[],"lastnames":["Xu"],"suffixes":[]},{"firstnames":["Jiaxin"],"propositions":[],"lastnames":["Shan"],"suffixes":[]},{"firstnames":["Arvind"],"propositions":[],"lastnames":["Krishnamurthy"],"suffixes":[]},{"firstnames":["Baris"],"propositions":[],"lastnames":["Kasikci"],"suffixes":[]},{"firstnames":["Liguang"],"propositions":[],"lastnames":["Xie"],"suffixes":[]}],"title":"PolyServe: Efficient Multi-SLO Serving at Scale","journal":"CoRR","volume":"abs/2507.17769","year":"2025","url":"https://doi.org/10.48550/arXiv.2507.17769","doi":"10.48550/ARXIV.2507.17769","eprinttype":"arXiv","eprint":"2507.17769","timestamp":"Mon, 18 Aug 2025 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-2507-17769.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2507-17769,\n author = {Kan Zhu and\n Haiyang Shi and\n Le Xu and\n Jiaxin Shan and\n Arvind Krishnamurthy and\n Baris Kasikci and\n Liguang Xie},\n title = {PolyServe: Efficient Multi-SLO Serving at Scale},\n journal = {CoRR},\n volume = {abs/2507.17769},\n year = {2025},\n url = {https://doi.org/10.48550/arXiv.2507.17769},\n doi = {10.48550/ARXIV.2507.17769},\n eprinttype = {arXiv},\n eprint = {2507.17769},\n timestamp = {Mon, 18 Aug 2025 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-2507-17769.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Zhu, K.","Shi, H.","Xu, L.","Shan, J.","Krishnamurthy, A.","Kasikci, B.","Xie, L."],"key":"DBLP:journals/corr/abs-2507-17769","id":"DBLP:journals/corr/abs-2507-17769","bibbaseid":"zhu-shi-xu-shan-krishnamurthy-kasikci-xie-polyserveefficientmultisloservingatscale-2025","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2507.17769"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/207/3468.bib","dataSources":["7ecbLnRSGBTHkhiqm"],"keywords":[],"search_terms":["polyserve","efficient","multi","slo","serving","scale","zhu","shi","xu","shan","krishnamurthy","kasikci","xie"],"title":"PolyServe: Efficient Multi-SLO Serving at Scale","year":2025}