From 8680bb614e83d1fc59b2c23e06ec554af12467af Mon Sep 17 00:00:00 2001
From: sealad886 <155285242+sealad886@users.noreply.github.com>
Date: Sun, 16 Mar 2025 08:31:47 +0000
Subject: [PATCH] Update mixed_2_6 and mixed_3_6 quant predicates to explicitly pass high_bits parameter

---
 llms/mlx_lm/utils.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llms/mlx_lm/utils.py b/llms/mlx_lm/utils.py
index 05fac92f..a09f2491 100644
--- a/llms/mlx_lm/utils.py
+++ b/llms/mlx_lm/utils.py
@@ -1052,8 +1052,8 @@ def mixed_quant_predicate_builder(
     return mixed_quant_predicate
 
 
-mixed_3_6 = mixed_quant_predicate_builder(low_bits=3)
-mixed_2_6 = mixed_quant_predicate_builder(low_bits=2)
+mixed_3_6 = mixed_quant_predicate_builder(low_bits=3, high_bits=6)
+mixed_2_6 = mixed_quant_predicate_builder(low_bits=2, high_bits=6)
 
 
 def convert(