Faster indexing math in a few kernels (#1589)

* wip: faster compiled kernels
* faster general unary with uint specialization
* index type in compiled, unary, binary, ternary, copy
* fix jit
* jit fix
* specialize gather + scatter
* nit in docs
2025-12-16 01:49:05 +08:00 · 2024-11-18 19:52:00 -08:00
parent bf481e8e5d
commit 2419edd5b2
25 changed files with 630 additions and 484 deletions
--- a/mlx/backend/metal/utils.h
+++ b/mlx/backend/metal/utils.h
@@ -61,4 +61,15 @@ inline void debug_set_primitive_buffer_label(

 std::string get_primitive_string(Primitive* primitive);

// Append every argument in `args` to `acc`, in order, using
// `std::string::operator+=`.
//
// Each argument must be a type accepted by `acc += arg` (for example
// `std::string`, `const char*`, or `char`). Arguments are bound by const
// reference, so string pieces are appended without being copied first; as a
// consequence, an argument that refers to `acc` itself observes the pieces
// appended before it. Calling with no pieces leaves `acc` unchanged.
template <typename... Args>
void concatenate(std::string& acc, const Args&... args) {
  // Left fold: ((acc += a0) += a1) += ...; operator+= returns `acc` itself,
  // so the chain keeps appending to the same string.
  (acc += ... += args);
}
+
 } // namespace mlx::core