Revert "Fix for Spec model TP + Chunked Prefill"

This reverts commit 6863d1f.

Signed-off-by: andoorve <[email protected]>
vllm-project · Nov 12, 2024 · 902daaa · 902daaa
1 parent 6863d1f
commit 902daaa
Showing 1 changed file with 0 additions and 6 deletions.
diff --git a/vllm/spec_decode/spec_decode_worker.py b/vllm/spec_decode/spec_decode_worker.py
@@ -641,12 +641,6 @@ def _run_non_driver_rank(self) -> bool:
         # that the hidden states can be propagated to proposer when needed.
         if data["no_spec"]:
             self.scorer_worker.execute_model()
-            # If no spec case we still want to run the proposer model
-            # but ONLY once to match `not skip_proposer` in
-            # driver `_run_no_spec`
-            if not data["disable_all_speculation"]:
-                self.proposer_worker.execute_model()
-            return True
 
         if not data["disable_all_speculation"]:
             # Even if num_lookahead_slots is zero, we want to run the