Remove the tokenizer argument from evaluate_dpo and its call in train_dpo, plus a minor update in dpo_loss

2025-12-16 02:08:55 +08:00 · 2025-01-26 15:25:27 +01:00
parent 4d0e52f7c8
commit 557649d8da
1 changed files with 0 additions and 3 deletions
--- a/llms/mlx_lm/tuner/dpo_trainer.py
+++ b/llms/mlx_lm/tuner/dpo_trainer.py
@@ -128,7 +128,6 @@ def dpo_loss(
        'chosen_logits_mean': mx.mean(policy_chosen_score)
    }
    return mx.mean(losses), reward, num_tokens, metrics
@@ -180,7 +179,6 @@ def evaluate_dpo(
    model,
    reference_model,
    dataset,
    tokenizer,
    batch_size,
    num_batches,
    beta: float,
@@ -328,7 +326,6 @@ def train_dpo(
                model=model,
                reference_model=reference_model,
                dataset=val_dataset,
                tokenizer=tokenizer,
                batch_size=args.batch_size,
                num_batches=args.val_batches,
                max_seq_length=args.max_seq_length,