Commit e673a97

some nits in lora (#208)
1 parent 3be5153 commit e673a97

File tree

4 files changed (+8, -7 lines)


mlx_lm/examples/lora_config.yaml

Lines changed: 2 additions & 2 deletions
@@ -1,5 +1,5 @@
 # The path to the local model directory or Hugging Face repo.
-model: "mlx_model"
+model: "mlx-community/Llama-3.2-1B-Instruct"

 # Whether or not to train (boolean)
 train: true
@@ -17,7 +17,7 @@ optimizer: adamw
 # bias_correction: true

 # Directory with {train, valid, test}.jsonl files
-data: "/path/to/training/data"
+data: "mlx-community/WikiSQL"

 # The PRNG seed
 seed: 0
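Note: the example config now points at a Hugging Face model repo and dataset instead of local placeholder paths. As a quick sanity check (a sketch, not part of the commit; it assumes PyYAML is installed and that the script runs from the repo root), the new defaults can be read back and the model resolved with mlx_lm's load helper:

import yaml
from mlx_lm import load

# Read the example config shipped with the repo (path assumed relative to the repo root).
with open("mlx_lm/examples/lora_config.yaml") as f:
    config = yaml.safe_load(f)

print(config["model"])  # mlx-community/Llama-3.2-1B-Instruct
print(config["data"])   # mlx-community/WikiSQL

# load() accepts a Hugging Face repo id and downloads it on first use.
model, tokenizer = load(config["model"])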

mlx_lm/fuse.py

Lines changed: 3 additions & 1 deletion
@@ -75,7 +75,9 @@ def main() -> None:
     model = load_adapters(model, args.adapter_path)

     fused_linears = [
-        (n, m.fuse()) for n, m in model.named_modules() if hasattr(m, "fuse")
+        (n, m.fuse(de_quantize=args.de_quantize))
+        for n, m in model.named_modules()
+        if hasattr(m, "fuse")
     ]

     if fused_linears:
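For context, this change forwards the parsed de_quantize argument to each adapter layer's fuse() call instead of silently dropping it. A standalone sketch of the pattern (fuse_adapters is a made-up helper name, not the actual fuse.py code):

import mlx.nn as nn

def fuse_adapters(model: nn.Module, de_quantize: bool = False):
    # Walk every submodule; any layer exposing a fuse() method (e.g. a LoRA
    # wrapper) gets fused, with the de_quantize option forwarded to it.
    return [
        (name, module.fuse(de_quantize=de_quantize))
        for name, module in model.named_modules()
        if hasattr(module, "fuse")
    ]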

mlx_lm/lora.py

Lines changed: 1 addition & 1 deletion
@@ -65,7 +65,7 @@
     "config": None,
     "grad_checkpoint": False,
     "lr_schedule": None,
-    "lora_parameters": {"rank": 8, "dropout": 0.0, "scale": 10.0},
+    "lora_parameters": {"rank": 8, "dropout": 0.0, "scale": 20.0},
     "mask_prompt": False,
     "wandb": None,
 }
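The only change here is the default LoRA scale, doubled from 10.0 to 20.0. In the usual LoRA formulation the low-rank product is multiplied by this scale before being added to (or fused into) the base weight, so the default adapter contribution is now twice as strong. A minimal illustration with made-up shapes (not the library's internal layout):

import mlx.core as mx

rank, in_dims, out_dims = 8, 64, 64
lora_a = mx.random.normal((rank, in_dims)) * 0.01   # low-rank factors
lora_b = mx.random.normal((out_dims, rank)) * 0.01

for scale in (10.0, 20.0):                 # old vs. new default
    delta = scale * (lora_b @ lora_a)      # (out_dims, in_dims) weight update
    print(scale, float(mx.abs(delta).max()))  # doubling scale doubles the update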

mlx_lm/tuner/lora.py

Lines changed: 2 additions & 3 deletions
@@ -52,9 +52,8 @@ def fuse(self, de_quantize: bool = False):
         output_dims, input_dims = weight.shape
         fused_linear = nn.Linear(input_dims, output_dims, bias=bias)

-        lora_b = (self.scale * self.lora_b.T).astype(dtype)
-        lora_a = self.lora_a.T.astype(dtype)
-        fused_linear.weight = weight + lora_b @ lora_a
+        delta = ((self.scale * self.lora_b.T) @ self.lora_a.T).astype(dtype)
+        fused_linear.weight = weight + delta
         if bias:
             fused_linear.bias = linear.bias

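This rewrite folds the scaled low-rank product into a single delta and casts it once at the end, instead of casting lora_b and lora_a to the weight dtype before multiplying, so the rank-sized matmul runs in the adapters' original precision. A standalone comparison of the two orderings with made-up shapes (a sketch, not the class's actual code):

import mlx.core as mx

scale, rank, in_dims, out_dims = 20.0, 8, 32, 32
lora_a = mx.random.normal((in_dims, rank))                    # float32 adapters
lora_b = mx.random.normal((rank, out_dims))
weight = mx.random.normal((out_dims, in_dims)).astype(mx.float16)
dtype = weight.dtype

# Old: cast each factor down, then multiply in the lower precision.
old = weight + (scale * lora_b.T).astype(dtype) @ lora_a.T.astype(dtype)
# New: multiply in float32, then cast the combined delta once.
new = weight + ((scale * lora_b.T) @ lora_a.T).astype(dtype)

print(float(mx.abs(old - new).max()))  # expected to be on the order of fp16 rounding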