This repository contains the source code implementation of the arXiv paper "Fail Fast, Win Big: Rethinking the Drafting Strategy in Speculative Decoding via Diffusion LLMs".
Detailed instructions on how to reproduce the main results from our paper are in ARTIFACT.md.
@article{pan2025failfast,
  author        = {Pan, Rui and Chen, Zhuofu and Liu, Hongyi and Krishnamurthy, Arvind and Netravali, Ravi},
  title         = {Fail Fast, Win Big: Rethinking the Drafting Strategy in Speculative Decoding via Diffusion {LLMs}},
  journal       = {arXiv preprint arXiv:2512.20573},
  year          = {2025},
  eprint        = {2512.20573},
  archiveprefix = {arXiv},
}