Patch summary: in vllm/v1/worker/gpu_worker.py, execute_dummy_batch() now calls
self.model_runner._dummy_run(1) instead of
self.model_runner._dummy_run(1, uniform_decode=True). No other line changes.
NOTE(review): the effect of omitting uniform_decode depends on the default that
_dummy_run declares for it, which this hunk does not show; confirm.
NOTE(review): line breaks and context-line indentation were reconstructed from a
whitespace-collapsed copy of this patch; verify them against the target file,
or apply with `git apply --ignore-whitespace`.

diff --git a/vllm/v1/worker/gpu_worker.py b/vllm/v1/worker/gpu_worker.py
index f59dacf13d85..d510f28ce408 100644
--- a/vllm/v1/worker/gpu_worker.py
+++ b/vllm/v1/worker/gpu_worker.py
@@ -489,7 +489,7 @@ def profile(self, is_start: bool = True):
                     sort_by="self_cuda_time_total"))
 
     def execute_dummy_batch(self) -> None:
-        self.model_runner._dummy_run(1, uniform_decode=True)
+        self.model_runner._dummy_run(1)
 
     def add_lora(self, lora_request: LoRARequest) -> bool:
         return self.model_runner.add_lora(lora_request)