Don't allocate outputs twice when a custom kernel has an init value (#1830)

2025-12-16 01:49:05 +08:00 · 2025-02-04 13:20:57 -08:00
parent f6c0499b8d
commit a229c8cef0
1 changed files with 2 additions and 1 deletions
--- a/mlx/backend/metal/custom_kernel.cpp
+++ b/mlx/backend/metal/custom_kernel.cpp
@@ -15,10 +15,11 @@ void CustomKernel::eval_gpu(
  std::vector<array> copies;

  for (auto& out : outputs) {
-    out.set_data(allocator::malloc_or_wait(out.nbytes()));
    if (init_value_) {
      copies.emplace_back(init_value_.value(), out.dtype());
      fill_gpu(copies.back(), out, s);
+    } else {
+      out.set_data(allocator::malloc_or_wait(out.nbytes()));
    }
  }