diff --git a/llms/mlx_lm/tokenizer_utils.py b/llms/mlx_lm/tokenizer_utils.py index 60cfb555..114a35e7 100644 --- a/llms/mlx_lm/tokenizer_utils.py +++ b/llms/mlx_lm/tokenizer_utils.py @@ -51,7 +51,7 @@ class StreamingDetokenizer: text = self.text segment = text[self.offset :] self.offset = len(text) - return text + return segment class NaiveStreamingDetokenizer(StreamingDetokenizer):