diff --git a/llms/mlx_lm/tuner/orpo_trainer.py b/llms/mlx_lm/tuner/orpo_trainer.py index 4eaace31..608d0dd0 100644 --- a/llms/mlx_lm/tuner/orpo_trainer.py +++ b/llms/mlx_lm/tuner/orpo_trainer.py @@ -84,6 +84,7 @@ def orpo_loss( return loss, reward, num_tokens + def evaluate_orpo( model, dataset,