Beyond Tokens: Semantic-Aware Speculative Decoding for Efficient Inference by Probing Internal States. Dong, X., Wang, S., Lin, D., Chen, B., & Hassan, A. E. CoRR, 2026.
Beyond Tokens: Semantic-Aware Speculative Decoding for Efficient Inference by Probing Internal States. [Paper](https://doi.org/10.48550/arXiv.2602.03708) | doi: 10.48550/arXiv.2602.03708 | bibtex:
@comment{arXiv preprint; record exported from the dblp computer science bibliography, which files arXiv papers under the journal name CoRR.}
@article{DBLP:journals/corr/abs-2602-03708,
  author       = {Dong, Ximing and
                  Wang, Shaowei and
                  Lin, Dayi and
                  Chen, Boyuan and
                  Hassan, Ahmed E.},
  title        = {Beyond Tokens: Semantic-Aware Speculative Decoding for Efficient Inference
                  by Probing Internal States},
  journal      = {CoRR},
  volume       = {abs/2602.03708},
  year         = {2026},
  url          = {https://doi.org/10.48550/arXiv.2602.03708},
  doi          = {10.48550/arXiv.2602.03708},
  eprinttype   = {arXiv},
  eprint       = {2602.03708},
  timestamp    = {Fri, 13 Mar 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2602-03708.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0