This commit is contained in:
Alex Barron 2024-12-02 11:11:23 -08:00
parent 80e5c37bb9
commit 5828703a5a

View File

@ -458,13 +458,14 @@ def load_model(
weights = model.sanitize(weights)
if (quantization := config.get("quantization", None)) is not None:
# Handle legacy models which may not have everything quantized
def class_predicate(p, m):
    """Decide whether (and how) to quantize the module *m* at path *p*.

    Returns the entry from the model config's per-layer quantization
    table when one exists for this path (presumably a dict of
    quantization parameters — confirm against ``nn.quantize``'s
    ``class_predicate`` contract), otherwise a bool: quantize only
    modules that support ``to_quantized`` and whose scales are present
    in the checkpoint weights.
    """
    per_layer = config["quantization"]
    # Explicit per-layer settings in the config take precedence.
    if p in per_layer:
        return per_layer[p]
    # Modules with no quantized counterpart can never be quantized.
    if not hasattr(m, "to_quantized"):
        return False
    # Legacy checkpoints may leave some layers unquantized; only
    # quantize when the saved weights actually carry scales for it.
    return f"{p}.scales" in weights
nn.quantize(