Fix prompt cache when the tokenizer has no chat template

2025-08-28 00:30:09 +08:00 · 2025-02-05 06:37:31 -08:00 · 2025-02-05 06:37:31 -08:00 · 087adcfacb
commit 087adcfacb
parent 6e6ba07b54
2 changed files with 2 additions and 2 deletions
--- a/llms/mlx_lm/cache_prompt.py
+++ b/llms/mlx_lm/cache_prompt.py
@@ -152,7 +152,7 @@ def main():
    print("Saving...")
    metadata = {}
    metadata["model"] = args.model
-    metadata["chat_template"] = tokenizer.chat_template
+    metadata["chat_template"] = json.dumps(tokenizer.chat_template)
    metadata["tokenizer_config"] = json.dumps(tokenizer_config)
    save_prompt_cache(args.prompt_cache_file, cache, metadata)

--- a/llms/mlx_lm/generate.py
+++ b/llms/mlx_lm/generate.py
@@ -199,7 +199,7 @@ def main():
        if tokenizer.chat_template is None:
            tokenizer.chat_template = tokenizer.default_chat_template
    elif using_cache:
-        tokenizer.chat_template = metadata["chat_template"]
+        tokenizer.chat_template = json.loads(metadata["chat_template"])

    prompt = args.prompt.replace("\\n", "\n").replace("\\t", "\t")
    prompt = sys.stdin.read() if prompt == "-" else prompt