We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d71bde4 · commit a434a2f · Copy full SHA for a434a2f
vllm/v1/core/sched/scheduler.py
@@ -474,6 +474,7 @@ def schedule(self) -> SchedulerOutput:
474
# pooling requests to be chunked
475
if (
476
not self.scheduler_config.chunked_prefill_enabled
477
+ and not self.scheduler_config.enable_hybrid_chunked_prefill
478
and num_new_tokens > token_budget
479
):
480
self.waiting.pop_request()
0 commit comments