LoRA: Remove unnecessary model type judgments (#388)

* LoRA: Remove unnecessary model type judgments
  1. Supported models are already checked in the load_model function in utils, so there is no need to repeat the check in lora.
  2. The checks in lora are not synchronized with those in utils.
* LoRA: Add LoRA supported models in mlx_lm utils
2025-08-09 02:16:37 +08:00 · 2024-02-01 03:55:27 +08:00 · 2024-02-01 03:55:27 +08:00 · ba3a9355d1
commit ba3a9355d1
parent 0a49ba0697
2 changed files with 6 additions and 7 deletions
--- a/llms/mlx_lm/lora.py
+++ b/llms/mlx_lm/lora.py
@ -7,13 +7,9 @@ import mlx.optimizers as optim
 import numpy as np
 from mlx.utils import tree_flatten
 from .models import llama, mixtral, phi2
 from .tuner.lora import LoRALinear
 from .tuner.trainer import TrainingArgs, evaluate, train
-from .utils import generate, load
+from .utils import generate, load, LORA_SUPPORTED_MODELS
 SUPPORTED_MODELS = [llama.Model, mixtral.Model, phi2.Model]
 def build_parser():
    parser = argparse.ArgumentParser(description="LoRA or QLoRA finetuning.")
@ -166,10 +162,10 @@ if __name__ == "__main__":
    print("Loading pretrained model")
    model, tokenizer = load(args.model)
-    if model.__class__ not in SUPPORTED_MODELS:
+    if model.__class__ not in LORA_SUPPORTED_MODELS:
        raise ValueError(
            f"Model {model.__class__} not supported. "
-            f"Supported models: { SUPPORTED_MODELS}"
+            f"Supported models: {LORA_SUPPORTED_MODELS}"
        )
    # Freeze all layers other than LORA linears
--- a/llms/mlx_lm/utils.py
+++ b/llms/mlx_lm/utils.py
@ -25,6 +25,9 @@ MODEL_MAPPING = {
    "qwen": qwen,
    "plamo": plamo,
 }
 LORA_SUPPORTED_MODELS = [
    llama.Model, mixtral.Model, phi2.Model, stablelm_epoch.Model
 ]
 MAX_FILE_SIZE_GB = 5
 linear_class_predicate = (