mirror of
https://github.com/ml-explore/mlx-examples.git
synced 2025-09-15 23:58:08 +08:00
niits
This commit is contained in:
@@ -312,7 +312,7 @@ def train_orpo(
 if rank == 0:
     print(
         f"Iter {it}: "
-        f"Val loss {val_loss:.3f}, "
+        f"Val loss {val_loss:.8f}, "
         f"Val chosen reward {val_rewards[0]:.3f}, "
         f"Val rejected reward {val_rewards[1]:.3f}, "
         f"Val took {val_time:.3f}s",
@@ -353,7 +353,7 @@ def train_orpo(
 
 if rank == 0:
     print(
-        f"Iter {it}: Train loss {train_loss:.3f}, "
+        f"Iter {it}: Train loss {train_loss:.8f}, "
         f"Chosen reward {train_rewards[0]:.3f}, "
         f"Rejected reward {train_rewards[1]:.3f}, "
         f"Learning Rate {learning_rate:.3e}, "
Reference in New Issue
Block a user