diff --git a/vllm/worker/hpu_model_runner.py b/vllm/worker/hpu_model_runner.py index a343e2fedb23..e2261cbb26b4 100644 --- a/vllm/worker/hpu_model_runner.py +++ b/vllm/worker/hpu_model_runner.py @@ -1554,10 +1554,8 @@ def warmup_model(self, kv_caches: List[torch.Tensor]) -> None: 'Please update Gaudi Software Suite.') with compile_only_mode_context( ) if can_use_compile_only_mode else contextlib.nullcontext(): - print("aa") self.warmup_all_buckets(self.bucketing_ctx.prompt_buckets, True, kv_caches) - print("bb") self.warmup_all_buckets(self.bucketing_ctx.decode_buckets, False, kv_caches)