to share quantization tables

Devjiu · Devjiu · commit d1d7f053d14b · 2025-05-16T13:46:39.000Z
diff --git a/bitsandbytes/backends/xpu/utils.py b/bitsandbytes/backends/xpu/utils.py
@@ -0,0 +1,50 @@
+import torch
+
+
+# Should be sorted to use binary search
+_NF4_QUANT_TABLE = torch.tensor(
+    [
+        -1.0,
+        -0.6961928009986877,
+        -0.5250730514526367,
+        -0.39491748809814453,
+        -0.28444138169288635,
+        -0.18477343022823334,
+        -0.09105003625154495,
+        0.0,
+        0.07958029955625534,
+        0.16093020141124725,
+        0.24611230194568634,
+        0.33791524171829224,
+        0.44070982933044434,
+        0.5626170039176941,
+        0.7229568362236023,
+        1.0,
+    ],
+    dtype=torch.float32,
+    device="xpu",
+)
+
+# Should be sorted to use binary search
+_FP4_QUANT_TABLE = torch.tensor(
+    [
+        -1.0000,
+        -0.6667,
+        -0.5000,
+        -0.3333,
+        -0.2500,
+        -0.1667,
+        -0.0052,
+        -0.0000,
+        0.0000,
+        0.0052,
+        0.1667,
+        0.2500,
+        0.3333,
+        0.5000,
+        0.6667,
+        1.0000,
+    ],
+    dtype=torch.float32,
+    device="xpu",
+)