mirror of
https://github.com/ml-explore/mlx-examples.git
synced 2025-06-26 02:33:23 +08:00
fix testing
This commit is contained in:
parent
2a8e6f6e44
commit
d84ad0cf86
@@ -342,7 +342,7 @@ def evaluate_model(args, model: nn.Module, tokenizer: TokenizerWrapper, test_set
|
||||
else:
|
||||
reference_model = model
|
||||
|
||||
- test_loss, test_rewards = evaluate_grpo(
|
||||
+ test_loss, _, test_rewards = evaluate_grpo(
|
||||
model=model,
|
||||
ref_model=reference_model,
|
||||
dataset=test_set,
|
||||
@@ -354,7 +354,10 @@ def evaluate_model(args, model: nn.Module, tokenizer: TokenizerWrapper, test_set
|
||||
group_size=args.group_size,
|
||||
epsilon=args.epsilon
|
||||
)
|
||||
- print(f"Test loss {test_loss:.3f}, Rewards: {test_rewards[0]:.3f}, {test_rewards[1]:.3f}")
|
||||
|
||||
+ test_ppl = math.exp(test_loss)
|
||||
|
||||
+ print(f"Test loss {test_loss:.3f}, Test ppl {test_ppl:.3f}, Rewards: {test_rewards[0]:.3f}, {test_rewards[1]:.3f}")
|
||||
else:
|
||||
test_loss = evaluate(
|
||||
model=model,
|
||||
|
Loading…
Reference in New Issue
Block a user