Skip to content

Commit

Permalink
updated
Browse files: browse the repository at this point in the history
  • Loading branch information
robertgshaw2-redhat committed Nov 17, 2024
1 parent 63b301a commit 1af03e0
Showing 1 changed file with 0 additions and 10 deletions.
10 changes: 0 additions & 10 deletions vllm/v1/worker/tpu_model_runner.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -257,10 +257,6 @@ def _prepare_prefill_inputs(
context_lens=None,
))

print(f"PREFILL {token_ids.shape=}")
print(f"PREFILL {positions.shape=}")
print(f"PREFILL {slot_mapping.shape=}")

return PrefillInputData(
request_ids=prefill_request_ids,
prompt_lens=prefill_prompt_lens,
Expand Down Expand Up @@ -319,12 +315,6 @@ def _prepare_decode_inputs(self, num_decodes: int) -> DecodeInputData:
# CONTEXT_LENS [batch_size]
context_lens = (positions.reshape(-1) + 1)

print(f"{token_ids.shape=}")
print(f"{positions.shape=}")
print(f"{slot_mapping.shape=}")
print(f"{block_table.shape=}")
print(f"{context_lens.shape=}")

# CPU<>TPU sync happens here.
return DecodeInputData(num_decodes=num_decodes,
token_ids=token_ids.to(self.device),
Expand Down

0 comments on commit 1af03e0

Please sign in to comment.