% Conference paper: SPIN (LLM inference with heterogeneous speculative models), IEEE INFOCOM 2025.
@Inproceedings{ Chen25-INFOCOM,
  author    = {Chen, Fahao and Li, Peng and Luan, Tom H. and Su, Zhou and Deng, Jing},
  title     = {{SPIN}: Accelerating Large Language Model Inference with Heterogeneous Speculative Models},
  booktitle = {Proc. of the 44th {IEEE} Conference on Computer Communications ({INFOCOM} '25)},
  month     = may # "~19--22",
  year      = {2025},
  pages     = {1--10},
  address   = {London, U. K.},
  doi       = {10.1109/INFOCOM55648.2025.11044522}
}