diff --git a/llms/mlx_lm/models/mamba2.py b/llms/mlx_lm/models/mamba2.py index 981daa74..822ebe8a 100644 --- a/llms/mlx_lm/models/mamba2.py +++ b/llms/mlx_lm/models/mamba2.py @@ -65,6 +65,7 @@ def silu(x): def ssd(x, A, B, C, chunk_size): batch, seqlen, nheads, dim = x.shape + B = mx.expand_dims(B, axis=2) C = mx.expand_dims(C, axis=2)