diff --git a/vllm/config/compilation.py b/vllm/config/compilation.py index e65728ba7f4e..4209f3a9731c 100644 --- a/vllm/config/compilation.py +++ b/vllm/config/compilation.py @@ -709,9 +709,7 @@ def is_attention_compiled_piecewise(self) -> bool: return self.level == CompilationLevel.PIECEWISE # Inductor partition case - return ( - self.level > CompilationLevel.NO_COMPILATION and self.backend == "inductor" - ) + return self.level > CompilationLevel.NO_COMPILATION and self.use_inductor def custom_op_log_check(self): """