Add grid_sample example to metal_kernel docs (#1352)

* Add `zero_outputs` and `atomic_outputs` options to `metal_kernel` * add grid sample to docs * zero_outputs -> init_value * add missing header for linux
2025-12-16 01:49:05 +08:00 · 2024-08-23 18:24:16 -07:00
parent 3b4d5484c7
commit b96e105244
6 changed files with 337 additions and 15 deletions
--- a/mlx/backend/metal/custom_kernel.cpp
+++ b/mlx/backend/metal/custom_kernel.cpp
@@ -12,12 +12,17 @@ void CustomKernel::eval_gpu(
    std::vector<array>& outputs) {
  auto& s = stream();

+  std::vector<array> copies;
+
  for (auto& out : outputs) {
    out.set_data(allocator::malloc_or_wait(out.nbytes()));
+    if (init_value_) {
+      array init = array(init_value_.value(), out.dtype());
+      copy_gpu(init, out, CopyType::Scalar, s);
+      copies.push_back(init);
+    }
  }

-  std::vector<array> copies;
-
  auto check_input = [&copies, &s, this](const array& x) -> const array {
    bool no_copy = x.flags().row_contiguous;
    if (!ensure_row_contiguous_ || no_copy) {