File tree Expand file tree Collapse file tree 2 files changed +3
-3
lines changed
model_executor/layers/quantization Expand file tree Collapse file tree 2 files changed +3
-3
lines changed Original file line number Diff line number Diff line change 3131def make_compiler (compilation_config : CompilationConfig ) -> CompilerInterface :
3232 if compilation_config .use_inductor :
3333 if envs .VLLM_USE_STANDALONE_COMPILE and is_torch_equal_or_newer (
34- "2.8.0 " ):
34+ "2.8.0a " ):
3535 logger .debug ("Using InductorStandaloneAdaptor" )
3636 return InductorStandaloneAdaptor ()
3737 else :
Original file line number Diff line number Diff line change @@ -44,14 +44,14 @@ def __init__(self,
4444 """
4545 # TorchAO quantization relies on tensor subclasses. In order
4646 # to enable proper caching, this needs standalone compile.
47- if is_torch_equal_or_newer("2.8.0 "):
47+ if is_torch_equal_or_newer("2.8.0a "):
4848 os.environ["VLLM_TEST_STANDALONE_COMPILE"] = "1"
4949 logger.info(
5050 "Using TorchAO: Setting VLLM_TEST_STANDALONE_COMPILE=1")
5151
5252 # TODO: remove after the torch dependency is updated to 2.8
5353 if is_torch_equal_or_newer(
54- "2.7.0") and not is_torch_equal_or_newer("2.8.0 "):
54+ "2.7.0") and not is_torch_equal_or_newer("2.8.0a "):
5555 os.environ["VLLM_DISABLE_COMPILE_CACHE"] = "1"
5656 logger.info("Using TorchAO: Setting VLLM_DISABLE_COMPILE_CACHE=1")
5757 """
You can’t perform that action at this time.
0 commit comments