Mirror of https://github.com/ml-explore/mlx-examples.git, synced 2025-09-01 04:14:38 +08:00
fix llava (#1149)
@@ -1,6 +1,7 @@
 # Copyright © 2023-2024 Apple Inc.
 
 import argparse
+import codecs
 import json
 import sys
 
@@ -188,6 +189,8 @@ def main():
     elif using_cache:
         tokenizer.chat_template = metadata["chat_template"]
 
+    prompt = codecs.decode(args.prompt, "unicode_escape")
+
     if not args.ignore_chat_template and (
         hasattr(tokenizer, "apply_chat_template")
         and tokenizer.chat_template is not None
@@ -199,7 +202,7 @@ def main():
         messages.append(
             {
                 "role": "user",
-                "content": sys.stdin.read() if args.prompt == "-" else args.prompt,
+                "content": sys.stdin.read() if prompt == "-" else prompt,
             }
         )
         prompt = tokenizer.apply_chat_template(
@@ -216,8 +219,6 @@ def main():
                 add_generation_prompt=True,
             )
             prompt = prompt[test_prompt.index("<query>") :]
-    else:
-        prompt = args.prompt
 
     sampler = make_sampler(args.temp, args.top_p, args.min_p, args.min_tokens_to_keep)
     response = generate(
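For context: codecs.decode(..., "unicode_escape") converts literal backslash escapes in a command-line string (e.g. the two characters backslash and "n") into the real characters they name. Hoisting that call above the chat-template branch means both the templated path and the stdin "-" check now see the decoded prompt. Below is a minimal standalone sketch of that behavior; it is not part of the commit, and the raw value is just an illustrative stand-in for what argparse would receive.

import codecs

# What argparse receives for: --prompt "Hello\nworld"
# (the shell passes a literal backslash followed by "n").
raw = "Hello\\nworld"

# The same call the patch moves to the top of main():
decoded = codecs.decode(raw, "unicode_escape")

print(repr(raw))      # 'Hello\\nworld'
print(repr(decoded))  # 'Hello\nworld' (a real newline now)
assert "\n" in decoded

# A plain "-" is unchanged by the decode, so the
# `prompt == "-"` stdin check in the patch still matches.
assert codecs.decode("-", "unicode_escape") == "-"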