Fix inductor config

ilmarkov · ilmarkov · commit 7bded2954c2d · 2025-10-28T13:26:59.000Z
Signed-off-by: ilmarkov <markovilya197@gmail.com>
diff --git a/vllm/compilation/backends.py b/vllm/compilation/backends.py
@@ -225,7 +225,12 @@ def compile(
             # Let compile_fx generate a key for us
             maybe_key = None
         else:
-            maybe_key = f"artifact_compile_range_{compile_range}_subgraph_{graph_index}"
+            maybe_key = "artifact_compile_range_"
+            if compile_range is None:
+                maybe_key += "dynamic_shape"
+            else:
+                maybe_key += f"{compile_range[0]}_{compile_range[1]}"
+            maybe_key += f"_subgraph_{graph_index}"
         with self.compile_context(compile_range):
             compiled_graph, handle = self.compiler.compile(
                 graph,
diff --git a/vllm/compilation/compiler_interface.py b/vllm/compilation/compiler_interface.py
@@ -594,8 +594,8 @@ def metrics_context(self) -> contextlib.AbstractContextManager:
 
 
 def set_inductor_config(config, compile_range):
-    if isinstance(compile_range, tuple):
-        # for a specific range of batchsizes, tuning triton kernel parameters
+    if isinstance(compile_range, tuple) and compile_range[0] == compile_range[1]:
+        # for a specific batch size, tuning triton kernel parameters
         # can be beneficial
         config["max_autotune"] = envs.VLLM_ENABLE_INDUCTOR_MAX_AUTOTUNE
         config["coordinate_descent_tuning"] = (