diff --git a/vllm/spec_decode/spec_decode_worker.py b/vllm/spec_decode/spec_decode_worker.py index 8f3c824c4d2c3..b279931ca4b02 100644 --- a/vllm/spec_decode/spec_decode_worker.py +++ b/vllm/spec_decode/spec_decode_worker.py @@ -417,7 +417,7 @@ def execute_model( all_zero_spec_tokens = all_zero_spec_tokens and ( sgm.num_speculative_tokens == 0) - if all_prompt: + if all_prompt and execute_model_req.seq_group_metadata_list: assert num_lookahead_slots == 0, ( "Prompt only runs should have num_lookahead_slots equal to 0. " "This should never happen, please file a bug at "