vllm-project · rafvasq · Jul 16, 2025 · Jul 22, 2025 · Jul 22, 2025 · Jul 22, 2025
@@ -40,7 +40,9 @@ class SpyrePlatform(Platform):
     # "spyre" device_name no longer worked due to https://github.com/vllm-project/vllm/pull/16464
     device_name: str = "cpu"
     device_type: str = "cpu"
-    supported_quantization: list[str] = ["gptq"]
+    # compressed-tensors is supported via the fms-model-optimizer AIU addons:
+    # https://github.com/foundation-model-stack/fms-model-optimizer/blob/main/fms_mo/aiu_addons/__init__.py
+    supported_quantization: list[str] = ["gptq", "compressed-tensors"]
     _warmup_shapes: Optional[tuple[dict[str, int], ...]] = None
     _block_size: int = 64  # hardcoded Spyre constraint for now
     _config: VllmConfig = None