We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 15c50f7 commit f620ad1 (Copy full SHA for f620ad1)
vllm/v1/engine/core.py
@@ -467,8 +467,16 @@ def step_with_batch_queue(
467
return engine_core_outputs, model_executed
468
469
def _process_aborts_queue(self):
470
- while not self.aborts_queue.empty():
471
- self.abort_requests(self.aborts_queue.get_nowait())
+ if not self.aborts_queue.empty():
+ request_ids = []
472
+ while not self.aborts_queue.empty():
473
+ ids = self.aborts_queue.get_nowait()
474
+ if isinstance(ids, str):
475
+ # Should be a list here, but also handle string just in case.
476
+ ids = (ids,)
477
+ request_ids.extend(ids)
478
+ # More efficient to abort all as a single batch.
479
+ self.abort_requests(request_ids)
480
481
def shutdown(self):
482
self.structured_output_manager.clear_backend()
0 commit comments