We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 315068e, commit 5cd2377. Copy full SHA for 5cd2377
vllm/v1/core/sched/scheduler.py
@@ -355,7 +355,12 @@ def schedule(self) -> SchedulerOutput:
355
while self.waiting and token_budget > 0:
356
if len(self.running) == self.max_num_running_reqs:
357
break
358
-
+ if len(scheduled_resumed_reqs) + len(scheduled_new_reqs) >= max(
359
+ 1,
360
+ self.max_num_running_reqs
361
+ // self.parallel_config.pipeline_parallel_size,
362
+ ):
363
+ break
364
request = self.waiting.peek_request()
365
366
# KVTransfer: skip request if still waiting for remote kvs.
0 commit comments