diff --git a/llms/mlx_lm/utils.py b/llms/mlx_lm/utils.py index e9388dbe..a7a998f4 100644 --- a/llms/mlx_lm/utils.py +++ b/llms/mlx_lm/utils.py @@ -58,8 +58,7 @@ def wired_limit(model): try: yield None finally: - # TODO... expose a synchronize?? - mx.zeros((1,)).item() + mx.synchronize() mx.metal.set_wired_limit(old_limit)