fix large ops (#1620)

2025-12-16 01:49:05 +08:00 · 2024-11-24 09:17:10 -08:00
parent bb303c45a5
commit 211411faf2
12 changed files with 37 additions and 25 deletions
--- a/mlx/backend/metal/ternary.cpp
+++ b/mlx/backend/metal/ternary.cpp
@@ -40,6 +40,9 @@ void ternary_op_gpu_inplace(
  auto ndim = shape.size();
  int work_per_thread;
  if (topt == TernaryOpType::General) {
+    large |=
+        (a.data_size() > UINT32_MAX || b.data_size() > UINT32_MAX ||
+         c.data_size() > UINT32_MAX);
    work_per_thread = large ? 4 : 2;
  } else {
    work_per_thread = 1;