Skip to content

Commit 01c30f6

Browse files
authored
Fix schedule error in splitwise deployment (#5149)
1 parent 147b2e5 commit 01c30f6

File tree

2 files changed

+3
-1
lines changed

2 files changed

+3
-1
lines changed

fastdeploy/engine/sched/resource_manager_v1.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -514,6 +514,8 @@ def schedule(self):
514 514   error_reqs: list[tuple[str, str]] = []
515 515   token_budget = self.config.scheduler_config.max_num_batched_tokens
516 516
    517 + self.check_and_free_block_tables()
    518 +
517 519   # First, schedule the RUNNING requests.
518 520   req_index = 0
519 521   num_decoding_req_nums = 0

fastdeploy/scheduler/local_scheduler.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -285,7 +285,7 @@ def get_requests(
285 285   if short_partial_requests + long_partial_requests > self.max_num_partial_prefills:
286 286   break
287 287   else:
288     - if current_prefill_tokens > max_num_batched_tokens:
    288 + if current_prefill_tokens > max_num_batched_tokens and len(requests) > 0:
289 289   break
290 290   requests.append(request.raw)
291 291

0 commit comments

Comments
 (0)