Attempt different packing

This commit is contained in:
Angelos Katharopoulos
2024-12-13 18:36:36 -08:00
parent a06c968f4d
commit e4b587819c
4 changed files with 33 additions and 25 deletions

View File

@@ -5,11 +5,11 @@ from functools import partial
import mlx.core as mx
from time_utils import time_fn
-D = 16384
+D = 8192
group_size = 64
bits = 3
dtype = mx.float16
-loops = 10
+loops = 100
def qmv_(x, wq, q_type):