Skip to content

Commit

Permalink
Fix format
Browse files: browse the repository at this point in the history
  • Loading branch information
sroy745 committed Dec 2, 2024
1 parent e19f99b commit 40f4ce2
Showing 1 changed file with 2 additions and 0 deletions.
2 changes: 2 additions & 0 deletions vllm/v1/worker/gpu_model_runner.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -610,6 +610,7 @@ class CachedRequestState:
mm_positions: List["PlaceholderRange"]
sampling_params: SamplingParams
generator: Optional[torch.Generator]

block_ids: List[int]
num_computed_tokens: int
output_token_ids: List[int]
Expand All @@ -618,6 +619,7 @@ class CachedRequestState:
def num_tokens(self) -> int:
return len(self.prompt_token_ids) + len(self.output_token_ids)


class InputBatch:

def __init__(
Expand Down

0 comments on commit 40f4ce2

Please sign in to comment.