mirror of
https://github.com/ml-explore/mlx-examples.git
synced 2025-06-24 09:21:18 +08:00
BUG FIX: Decoding results in garbled text when multiple tokens represent a single character (e.g., Chinese). (#398)
* Decoding results in garbled text when multiple tokens represent a single character (e.g., Chinese).
* Decoding results in garbled text when multiple tokens represent a single character (e.g., Chinese).
This commit is contained in:
parent
94358219cf
commit
0340113e02
@ -292,8 +292,9 @@ def generate(model, prompt, tokenizer, args):
|
|||||||
|
|
||||||
tokens.append(token.item())
|
tokens.append(token.item())
|
||||||
s = tokenizer.decode(tokens)
|
s = tokenizer.decode(tokens)
|
||||||
print(s[skip:], end="", flush=True)
|
if len(s) - skip > 1:
|
||||||
skip = len(s)
|
print(s[skip:-1], end="", flush=True)
|
||||||
|
skip = len(s) - 1
|
||||||
print(tokenizer.decode(tokens)[skip:], flush=True)
|
print(tokenizer.decode(tokens)[skip:], flush=True)
|
||||||
print("=" * 10)
|
print("=" * 10)
|
||||||
if len(tokens) == 0:
|
if len(tokens) == 0:
|
||||||
|
Loading…
Reference in New Issue
Block a user