File tree Expand file tree Collapse file tree 2 files changed +3
-3
lines changed
model_executor/layers/quantization Expand file tree Collapse file tree 2 files changed +3
-3
lines changed Original file line number Diff line number Diff line change 31
31
def make_compiler (compilation_config : CompilationConfig ) -> CompilerInterface :
32
32
if compilation_config .use_inductor :
33
33
if envs .VLLM_USE_STANDALONE_COMPILE and is_torch_equal_or_newer (
34
- "2.8.0 " ):
34
+ "2.8.0a " ):
35
35
logger .debug ("Using InductorStandaloneAdaptor" )
36
36
return InductorStandaloneAdaptor ()
37
37
else :
Original file line number Diff line number Diff line change @@ -44,14 +44,14 @@ def __init__(self,
44
44
"""
45
45
# TorchAO quantization relies on tensor subclasses. In order
46
46
# to enable proper caching, this needs standalone compile.
47
- if is_torch_equal_or_newer("2.8.0 "):
47
+ if is_torch_equal_or_newer("2.8.0a "):
48
48
os.environ["VLLM_TEST_STANDALONE_COMPILE"] = "1"
49
49
logger.info(
50
50
"Using TorchAO: Setting VLLM_TEST_STANDALONE_COMPILE=1")
51
51
52
52
# TODO: remove after the torch dependency is updated to 2.8
53
53
if is_torch_equal_or_newer(
54
- "2.7.0") and not is_torch_equal_or_newer("2.8.0 "):
54
+ "2.7.0") and not is_torch_equal_or_newer("2.8.0a "):
55
55
os.environ["VLLM_DISABLE_COMPILE_CACHE"] = "1"
56
56
logger.info("Using TorchAO: Setting VLLM_DISABLE_COMPILE_CACHE=1")
57
57
"""
You can’t perform that action at this time.
0 commit comments