We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 62ad56f, commit 89f0ca7. Copy full SHA for 89f0ca7
vllm/v1/worker/gpu_model_runner.py
@@ -2826,7 +2826,7 @@ def execute_model(
2826
# returns True. Before returning early here, we call
2827
# dummy run to ensure coordinate_batch_across_dp
2828
# is called into, to avoid out-of-sync issues.
2829
- self._dummy_run(self._get_num_input_tokens(1))
+ self._dummy_run(1)
2830
if not has_kv_transfer_group():
2831
# Return empty ModelRunnerOutput if no work to do.
2832
return EMPTY_MODEL_RUNNER_OUTPUT
0 commit comments