We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5ca7b40, commit 728f7a2 (Copy full SHA for 728f7a2)
vllm/model_executor/layers/quantization/kernels/mixed_precision/machete.py
@@ -32,6 +32,9 @@ def can_implement(cls,
32
if not current_platform.is_cuda():
33
return False, "Machete only supported on CUDA"
34
35
+ if not current_platform.is_device_capability(90):
36
+ return False, "Machete requires compute capability of 90 (Hopper)"
37
+
38
if c.has_g_idx and\
39
c.partition_weight_shape[0] != c.full_weight_shape[0]:
40
return False, "Act reordering currently not supported by Machete, "\
0 commit comments