5-bit quants

This commit is contained in:
Awni Hannun
2025-05-28 10:28:10 -07:00
parent 54a71f270a
commit 9754ea5f63
7 changed files with 246 additions and 71 deletions

View File

@@ -634,6 +634,7 @@ class TestVmap(mlx_tests.MLXTestCase):
self.assertEqual(fy.shape, (4, 5, 6, 7))
def test_leaks(self):
gc.collect()
mx.synchronize()
if mx.metal.is_available():
mem_pre = mx.get_active_memory()
@@ -653,6 +654,7 @@ class TestVmap(mlx_tests.MLXTestCase):
outer()
gc.collect()
mx.synchronize()
if mx.metal.is_available():
mem_post = mx.get_active_memory()
else: