From e17a7dc443bc5d5d603922b3df1737868ed35971 Mon Sep 17 00:00:00 2001 From: jamesm131 Date: Sun, 22 Sep 2024 20:10:56 +1000 Subject: [PATCH] Check hf_cache for mlx models --- llms/mlx_lm/server.py | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/llms/mlx_lm/server.py b/llms/mlx_lm/server.py index 0c8ae83e..f2d8b86a 100644 --- a/llms/mlx_lm/server.py +++ b/llms/mlx_lm/server.py @@ -11,6 +11,7 @@ from pathlib import Path from typing import Dict, List, Literal, NamedTuple, Optional, Sequence, Union import mlx.core as mx +from huggingface_hub import scan_cache_dir from .utils import generate_step, load @@ -635,13 +636,21 @@ class APIHandler(BaseHTTPRequestHandler): """ self._set_completion_headers(200) self.end_headers() + + # Scan the cache directory for downloaded mlx models + hf_cache_info = scan_cache_dir() + downloaded_models = [ + repo for repo in hf_cache_info.repos if "mlx" in repo.repo_id + ] + # Create a list of available models models = [ { - "id": self.model_provider.cli_args.model, + "id": repo.repo_id, "object": "model", "created": self.created, } + for repo in downloaded_models ] response = {"object": "list", "data": models}