Skip to content

Commit

Permalink
change resuming policy TODO to right pos
Browse files Browse the repository at this point in the history
  • Loading branch information
jiange91 committed Aug 15, 2023
1 parent 7041160 commit 5eb4f55
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 5 deletions.
5 changes: 4 additions & 1 deletion vllm/core/scheduler.py
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,10 @@ def get_paused_seq_group(self, request_id: str) \
else:
raise ValueError(f"No paused request with request id {request_id}")

# TODO: add logic for other two modes
# TODO: (Need discussion) different policy of resuming APIs:
# 1. (implemented) API with preserve mode: FCFS in the running group
# 2. (?) API with recompute mode: First in the waiting group
# 3. (?) API with swap mode: FCFS in the swapped group
def resume_seq_group(self, request_id: str) -> None:
seq_group, mode = self.get_paused_seq_group(request_id)
del self.paused[request_id]
Expand Down
4 changes: 0 additions & 4 deletions vllm/engine/llm_engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -276,10 +276,6 @@ def resume_request(self,
seq_group.clear_and_set(seqs)
self.scheduler.resume_seq_group(request_id)

# TODO: (Need discussion) different policies for resuming APIs; currently:
# 1. API with preserve mode: FCFS in the running group
# 2. (?) API with recompute mode: First in the waiting group
# 3. (?) API with swap mode: FCFS in the swapped group
# NOTE: seq_id_2_api_rel is to support multiple API calls in a SeqGroup
# need mapping seq_id -> API tokens to append result to the right seq
def new_resume_request(self, request_id: str,
Expand Down

0 comments on commit 5eb4f55

Please sign in to comment.