cast around lora adapters (#613)

This commit is contained in:
Awni Hannun 2024-03-24 19:34:51 -07:00 committed by GitHub
parent 5a52899405
commit bbfcc103d7
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -97,9 +97,6 @@ class LoRALinear(nn.Module):
         self.lora_b = mx.zeros(shape=(r, output_dims))

     def __call__(self, x):
-        dtype = self.linear.weight.dtype
-        if isinstance(self.linear, nn.QuantizedLinear):
-            dtype = self.linear.scales.dtype
-        y = self.linear(x.astype(dtype))
+        y = self.linear(x)
         z = (self.dropout(x) @ self.lora_a) @ self.lora_b
-        return y + self.scale * z
+        return y + (self.scale * z).astype(x.dtype)