From 18c9652ec28f9549d1ab798a282ce3747e56f57d Mon Sep 17 00:00:00 2001 From: "chenguangjian.jk" Date: Mon, 5 Aug 2024 10:33:21 +0800 Subject: [PATCH] mlx_lm.server --model mlx-community/gemma-2-9b-it-8bit --trust-remote-code --port 8722 --- llms/mlx_lm/Makefile | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/llms/mlx_lm/Makefile b/llms/mlx_lm/Makefile index 94844d12..26786dba 100644 --- a/llms/mlx_lm/Makefile +++ b/llms/mlx_lm/Makefile @@ -1,5 +1,13 @@ +c: + conda activate m3mlx + +cd_mlx_lm: + cd llms/mlx_lm + + run: - mlx_lm.server --model mlx-community/Mistral-Nemo-Instruct-2407-8bit --trust-remote-code --port 8722 + #mlx_lm.server --model mlx-community/Mistral-Nemo-Instruct-2407-8bit --trust-remote-code --port 8722 + mlx_lm.server --model mlx-community/gemma-2-9b-it-8bit --trust-remote-code --port 8722 k: ./kill.sh @@ -7,5 +15,3 @@ k: w: curl -X GET "http://127.0.0.1:9000/api/ai/WriteBlogRandomlyWithLLM?model=MLXLMServer" -H "Request-Origion:SwaggerBootstrapUi" -H "accept:*/*" -c: - conda activate m3mlx \ No newline at end of file