diff --git a/llms/mlx_lm/chat.py b/llms/mlx_lm/chat.py index 09a39e59..1c135ad1 100644 --- a/llms/mlx_lm/chat.py +++ b/llms/mlx_lm/chat.py @@ -5,7 +5,7 @@ import json import mlx.core as mx -from .models.cache import load_prompt_cache, make_prompt_cache, save_prompt_cache +from .models.cache import make_prompt_cache from .utils import load, stream_generate DEFAULT_TEMP = 0.0