vllm-project · houseroad · Jun 13, 2025 · Jun 13, 2025 · Jun 13, 2025 · houseroad
diff --git a/vllm/compilation/backends.py b/vllm/compilation/backends.py
@@ -31,7 +31,7 @@
 def make_compiler(compilation_config: CompilationConfig) -> CompilerInterface:
     if compilation_config.use_inductor:
         if envs.VLLM_USE_STANDALONE_COMPILE and is_torch_equal_or_newer(
-                "2.8.0"):
+                "2.8.0a"):
             logger.debug("Using InductorStandaloneAdaptor")
             return InductorStandaloneAdaptor()
         else:

@@ -44,14 +44,14 @@ def __init__(self,
         """
         # TorchAO quantization relies on tensor subclasses. In order,
         # to enable proper caching this needs standalone compile
-        if is_torch_equal_or_newer("2.8.0"):
+        if is_torch_equal_or_newer("2.8.0a"):
             os.environ["VLLM_TEST_STANDALONE_COMPILE"] = "1"
             logger.info(
                 "Using TorchAO: Setting VLLM_TEST_STANDALONE_COMPILE=1")
 
         # TODO: remove after the torch dependency is updated to 2.8
         if is_torch_equal_or_newer(
-                "2.7.0") and not is_torch_equal_or_newer("2.8.0"):
+                "2.7.0") and not is_torch_equal_or_newer("2.8.0a"):
             os.environ["VLLM_DISABLE_COMPILE_CACHE"] = "1"
             logger.info("Using TorchAO: Setting VLLM_DISABLE_COMPILE_CACHE=1")
         """