Add softmin, hardshrink, hardtanh (#1180)

--------- Co-authored-by: Nikhil Mehta <nikmehta@tesla.com>
2025-12-16 01:49:05 +08:00 · 2024-06-04 15:48:18 -07:00
parent 83b11bc58d
commit 0b7d71fd2f
14 changed files with 110 additions and 20 deletions
--- a/python/tests/test_fast_sdpa.py
+++ b/python/tests/test_fast_sdpa.py
@@ -15,7 +15,6 @@ def mlx_primitives_sdpa(q, k, v, scale):

 # SDPA for GQA (n_heads > n_kv_heads, n_kv_heads > 1, n_heads % n_kv_heads == 0)
 def mlx_primitives_sdpa_with_gqa(q, k, v, scale):
-
    n_repeats = q.shape[1] // k.shape[1]

    # borrowing kv cache tiling from mlx-examples/llms/mistral/mistral.py
@@ -34,7 +33,6 @@ def mlx_primitives_sdpa_with_gqa(q, k, v, scale):

 class TestFastSelfAttentionSDPA(mlx_tests.MLXTestCase):
    def test_fast_sdpa(self):
-
        # Not yet supported:
        # * K pre-transposed in kernel, V pre-transposed in kernel
        np.random.seed(0)