% Preprint record hosted by Preprints (see the doi field). The citation key is kept as-is so existing cite commands keep resolving.
@article{202409.1208,
  author    = {MS, Adarsh and VG, Jithin and PS, Ditto},
  title     = {Efficient Hybrid Inference for {LLMs}: Reward-Based Token Modelling with Selective Cloud Assistance},
  journal   = {Preprints},
  publisher = {Preprints},
  year      = 2024,
  month     = sep,
  doi       = {10.20944/preprints202409.1208.v1},
  url       = {https://doi.org/10.20944/preprints202409.1208.v1},
}