diff --git a/llms/mlx_lm/server.py b/llms/mlx_lm/server.py index f2d8b86a..42962b54 100644 --- a/llms/mlx_lm/server.py +++ b/llms/mlx_lm/server.py @@ -594,6 +594,7 @@ class APIHandler(BaseHTTPRequestHandler): ): prompt = self.tokenizer.apply_chat_template( body["messages"], + body.get("tools", None), tokenize=True, add_generation_prompt=True, )