Skip to content

Commit

Permalink
revert changes to v0 model runner
Browse files Browse the repository at this point in the history
  • Loading branch information
Varun Sundar Rabindranath committed Nov 22, 2024
1 parent 191afc8 commit 3cdc02d
Showing 1 changed file with 1 addition and 5 deletions.
6 changes: 1 addition & 5 deletions vllm/worker/model_runner.py
Original file line number Diff line number Diff line change
Expand Up @@ -917,8 +917,7 @@ def build(self) -> ModelInputForGPU:
lora_mapping = LoRAMapping(
**dict(index_mapping=lora_index_mapping,
prompt_mapping=lora_prompt_mapping,
- is_prefill = False))
- #is_prefill=not self.decode_only))
+ is_prefill=not self.decode_only))

# Prompt adapter data.
prompt_adapter_requests: Set[PromptAdapterRequest] = set()
Expand Down Expand Up @@ -1613,9 +1612,6 @@ def execute_model(
if self.lora_config:
assert model_input.lora_requests is not None
assert model_input.lora_mapping is not None
- #print (f" index mapping : {len(model_input.lora_mapping.index_mapping)} {model_input.lora_mapping.index_mapping}")
- #print (f" prompt mapping : {len(model_input.lora_mapping.prompt_mapping)} {model_input.lora_mapping.prompt_mapping}")
- #print (f" # lora requests : {len(model_input.lora_requests)}")
self.set_active_loras(model_input.lora_requests,
model_input.lora_mapping)

Expand Down

0 comments on commit 3cdc02d

Please sign in to comment.