comment

2025-08-29 09:17:29 +08:00 · 2024-12-02 11:11:23 -08:00 · 2024-12-02 11:11:23 -08:00 · 5828703a5a
commit 5828703a5a
parent 80e5c37bb9
1 changed files with 2 additions and 1 deletions
--- a/llms/mlx_lm/utils.py
+++ b/llms/mlx_lm/utils.py
@@ -458,13 +458,14 @@ def load_model(
        weights = model.sanitize(weights)
    if (quantization := config.get("quantization", None)) is not None:
-        # Handle legacy models which may not have everything quantized
+
        def class_predicate(p, m):
            # Handle custom per layer quantizations
            if p in config["quantization"]:
                return config["quantization"][p]
            if not hasattr(m, "to_quantized"):
                return False
            # Handle legacy models which may not have everything quantized
            return f"{p}.scales" in weights
        nn.quantize(