Use .to() instead of get_original_weight in linear_nf4 backward (#90)

rohan-varma · cpuhrsch · web-flow · commit a7670be58700 · 2024-03-27T21:07:40.000-07:00
Co-authored-by: cpuhrsch <cpuhrsch@googlemail.com>
diff --git a/torchao/dtypes/nf4tensor.py b/torchao/dtypes/nf4tensor.py
@@ -569,9 +569,9 @@ def forward(ctx, input: torch.Tensor, weight: NF4Tensor):
     #  inconsistently.
 
     def backward(ctx, grad_output):
-        """The nf4 weight will never require grad so we can just return the grad_output @ weight.get_original_weight()"""
+        """The nf4 weight will never require grad so we can just return the grad_output @ weight.to(grad_output.dtype)"""
         weight: NF4Tensor = ctx.nf4_weight
-        return grad_output @ weight.get_original_weight(), None
+        return grad_output @ weight.to(grad_output.dtype), None
 
 
 def linear_nf4(input: torch.Tensor, weight: NF4Tensor) -> torch.Tensor: