We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 147b2e5, commit 01c30f6 (Copy full SHA for 01c30f6)
fastdeploy/engine/sched/resource_manager_v1.py
@@ -514,6 +514,8 @@ def schedule(self):
514
error_reqs: list[tuple[str, str]] = []
515
token_budget = self.config.scheduler_config.max_num_batched_tokens
516
517
+ self.check_and_free_block_tables()
518
+
519
# First, schedule the RUNNING requests.
520
req_index = 0
521
num_decoding_req_nums = 0
fastdeploy/scheduler/local_scheduler.py
@@ -285,7 +285,7 @@ def get_requests(
285
if short_partial_requests + long_partial_requests > self.max_num_partial_prefills:
286
break
287
else:
288
- if current_prefill_tokens > max_num_batched_tokens:
+ if current_prefill_tokens > max_num_batched_tokens and len(requests) > 0:
289
290
requests.append(request.raw)
291
0 commit comments