log depyf folder, fix context for TestBackend, fix pattern dump

ProExpertProg · ProExpertProg · commit c8675ffdbcf5 · 2025-10-11T23:32:47.000-04:00
Signed-off-by: Luka Govedič <lgovedic@redhat.com>
diff --git a/tests/compile/backend.py b/tests/compile/backend.py
@@ -3,6 +3,7 @@
 
 import weakref
 from collections.abc import Sequence
+from contextlib import nullcontext
 from copy import deepcopy
 from typing import Callable, Union
 
@@ -16,6 +17,9 @@
 from vllm.compilation.pass_manager import with_pattern_match_debug
 from vllm.compilation.vllm_inductor_pass import VllmInductorPass
 from vllm.config import VllmConfig, get_current_vllm_config
+from vllm.logger import init_logger
+
+logger = init_logger("vllm.tests.compile.backend")
 
 
 class LazyInitPass(InductorPass):
@@ -55,16 +59,19 @@ def __init__(self, *passes: Union[InductorPass, Callable[[fx.Graph], None]]):
         self.inductor_config["post_grad_custom_post_pass"] = self.post_pass
 
         if debug_dump_path := vllm_config.compile_debug_dump_path():
-            self.ctx = depyf.prepare_debug(debug_dump_path.as_posix())
-            self.ctx.__enter__()
+            logger.debug("Dumping depyf output to %s", debug_dump_path)
+            self.debug_ctx = depyf.prepare_debug(debug_dump_path.as_posix())
         else:
-            self.ctx = None
+            self.debug_ctx = nullcontext()
 
     def __call__(self, graph: fx.GraphModule, example_inputs):
         self.graph_pre_compile = deepcopy(graph)
         from torch._inductor.compile_fx import compile_fx
 
-        return compile_fx(graph, example_inputs, config_patches=self.inductor_config)
+        with self.debug_ctx:
+            return compile_fx(
+                graph, example_inputs, config_patches=self.inductor_config
+            )
 
     @with_pattern_match_debug
     def post_pass(self, graph: fx.Graph):
@@ -83,9 +90,6 @@ def post_pass(self, graph: fx.Graph):
         # assign by reference, will reflect the final state of the graph
         self.final_graph = graph
 
-        if self.ctx is not None:
-            self.ctx.__exit__(None, None, None)
-
     def check_before_ops(self, ops: Sequence[OpOverload], fully_replaced=True):
         for op in ops:
             num_pre = len(list(find_op_nodes(op, self.graph_pre_pass)))
diff --git a/vllm/compilation/monitor.py b/vllm/compilation/monitor.py
@@ -22,6 +22,7 @@ def start_monitoring_torch_compile(vllm_config: VllmConfig):
         import depyf
 
         path.mkdir(parents=True, exist_ok=True)
+        logger.debug("Dumping depyf output to %s", path)
         global context_manager
         context_manager = depyf.prepare_debug(path.as_posix())
         context_manager.__enter__()
diff --git a/vllm/compilation/vllm_inductor_pass.py b/vllm/compilation/vllm_inductor_pass.py
@@ -115,7 +115,8 @@ def dump_patterns(self, config: VllmConfig, pm_pass: PatternMatcherPass):
                 f" please add to dump_patterns if there are any errors.\n\n"
                 f"from torch._higher_order_ops.auto_functionalize import "
                 f"auto_functionalized as auto_functionalized\n"
-                f"from torch._inductor.pattern_matcher import *",
+                f"from torch._inductor.pattern_matcher import *\n"
+                f"vllm = torch.ops.vllm",
                 file=f,
             )
 

Original file line number	Diff line number	Diff line change
`@@ -115,7 +115,8 @@ def dump_patterns(self, config: VllmConfig, pm_pass: PatternMatcherPass):`
`115`	`115`	`f" please add to dump_patterns if there are any errors.\n\n"`
`116`	`116`	`f"from torch._higher_order_ops.auto_functionalize import "`
`117`	`117`	`f"auto_functionalized as auto_functionalized\n"`
`118`		`- f"from torch._inductor.pattern_matcher import *",`
	`118`	`+ f"from torch._inductor.pattern_matcher import *\n"`
	`119`	`+ f"vllm = torch.ops.vllm",`
`119`	`120`	`file=f,`
`120`	`121`	`)`
`121`	`122`