Merge branch 'ml-explore:main' into adding-GRPO-training

2025-12-16 02:08:55 +08:00 · 2025-02-22 19:11:26 +01:00
parent c0bd89aa15 09b641aaa7
commit bd5f081ca5
5 changed files with 16 additions and 22 deletions
--- a/llms/mlx_lm/lora.py
+++ b/llms/mlx_lm/lora.py
@@ -285,8 +285,14 @@ def train_model(
    training_callback: TrainingCallback = None,
 ):
    model.freeze()
+    if args.num_layers > len(model.layers):
+        raise ValueError(
+            f"Requested to train {args.num_layers} layers "
+            f"but the model only has {len(model.layers)} layers."
+        )
+
    if args.fine_tune_type == "full":
-        for l in model.layers[-min(args.num_layers, 0) :]:
+        for l in model.layers[-max(args.num_layers, 0) :]:
            l.unfreeze()
    elif args.fine_tune_type in ["lora", "dora"]:
        # Convert linear layers to lora/dora layers and unfreeze in the process