From d9da35f458ffbd145350a3c19b6a6b607698ee8e Mon Sep 17 00:00:00 2001 From: Goekdeniz-Guelmez Date: Mon, 10 Feb 2025 10:52:32 +0100 Subject: [PATCH] nits --- llms/mlx_lm/tuner/grpo_trainer.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/llms/mlx_lm/tuner/grpo_trainer.py b/llms/mlx_lm/tuner/grpo_trainer.py index b3619e0a..1f9ef18a 100644 --- a/llms/mlx_lm/tuner/grpo_trainer.py +++ b/llms/mlx_lm/tuner/grpo_trainer.py @@ -142,9 +142,6 @@ def generate_grpo(model, prompt, max_tokens, tokenizer, temperature): if current_length >= end_sequence_length: last_tokens = output[current_length - end_sequence_length:current_length].tolist() - # print(f"Last tokens: {last_tokens}") - # print(f"Decoded text: {tokenizer.decode(last_tokens)}") - # print(f"Target sequence: {end_sequence}") if last_tokens == end_sequence: break