Passing parameterized loss and batching to trainer (#391)

This commit is contained in:
Chime Ogbuji 2024-02-13 10:03:25 -05:00 committed by GitHub
parent 954aa50c54
commit e446598f62
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -99,6 +99,7 @@ def evaluate(
     num_batches,
     max_seq_length=2048,
     loss: callable = default_loss,
+    iterate_batches: callable = iterate_batches
 ):
     all_losses = []
     ntokens = 0
@@ -126,6 +127,7 @@ def train(
     val_dataset,
     args: TrainingArgs = TrainingArgs(),
     loss: callable = default_loss,
+    iterate_batches: callable = iterate_batches
 ):
     # Create checkpoints directory if it does not exist
     if not os.path.exists("checkpoints"):
@@ -186,6 +188,7 @@ def train(
             batch_size=args.batch_size,
             num_batches=args.val_batches,
             max_seq_length=args.max_seq_length,
+            iterate_batches=iterate_batches
         )
         print(
             f"Iter {it + 1}: "