improve quant docs

This commit is contained in:
Awni Hannun
2025-10-28 07:12:35 -07:00
parent 94fe5114fa
commit 5a043fd793
3 changed files with 42 additions and 32 deletions

View File

@@ -146,7 +146,7 @@ class TestQuantized(mlx_tests.MLXTestCase):
w_q, scales = mx.quantize(w, mode="nvfp4")
with self.assertRaises(ValueError):
-mx.dequantize(w_q, scales, mode="nvfp4")
+mx.dequantize(w_q, scales, bits=3, mode="nvfp4")
with self.assertRaises(ValueError):
mx.dequantize(w_q, scales, group_size=32, mode="nvfp4")