Move the legacy-model quantization comment next to the check it describes

2025-09-01 12:49:50 +08:00 · 2024-12-02 11:11:23 -08:00
parent 80e5c37bb9
commit 5828703a5a
1 changed files with 2 additions and 1 deletions
--- a/llms/mlx_lm/utils.py
+++ b/llms/mlx_lm/utils.py
@@ -458,13 +458,14 @@ def load_model(
        weights = model.sanitize(weights)

    if (quantization := config.get("quantization", None)) is not None:
-        # Handle legacy models which may not have everything quantized
+
        def class_predicate(p, m):
            # Handle custom per layer quantizations
            if p in config["quantization"]:
                return config["quantization"][p]
            if not hasattr(m, "to_quantized"):
                return False
+            # Handle legacy models which may not have everything quantized
            return f"{p}.scales" in weights

        nn.quantize(