From e3d275bc4929af285e8c58ebae3f23a698e317f3 Mon Sep 17 00:00:00 2001 From: Alex Barron Date: Mon, 14 Apr 2025 16:37:23 -0700 Subject: [PATCH] rebase on main --- mlx/backend/metal/primitives.cpp | 2 +- mlx/backend/metal/quantized.cpp | 10 +++++----- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/mlx/backend/metal/primitives.cpp b/mlx/backend/metal/primitives.cpp index e47ee9030..1bcff36bd 100644 --- a/mlx/backend/metal/primitives.cpp +++ b/mlx/backend/metal/primitives.cpp @@ -232,7 +232,7 @@ void ArgReduce::eval_gpu(const std::vector& inputs, array& out) { break; } auto& in = inputs[0]; - out.set_data(allocator::malloc_or_wait(out.nbytes())); + out.set_data(allocator::malloc(out.nbytes())); auto& s = stream(); arg_reduce_dispatch(in, out, axis_, op_name, s); } diff --git a/mlx/backend/metal/quantized.cpp b/mlx/backend/metal/quantized.cpp index 964eb081e..9eac24332 100644 --- a/mlx/backend/metal/quantized.cpp +++ b/mlx/backend/metal/quantized.cpp @@ -636,7 +636,7 @@ void fast::TrellisQuantize::eval_gpu( std::vector& outputs) { auto& w_pre = inputs[0]; auto& out = outputs[0]; - out.set_data(allocator::malloc_or_wait(out.nbytes())); + out.set_data(allocator::malloc(out.nbytes())); auto& s = stream(); auto& d = metal::device(s.device); @@ -660,19 +660,19 @@ void fast::TrellisQuantize::eval_gpu( constexpr int num_states = 1 << 14; array scores({B, num_states}, float16, nullptr, {}); - scores.set_data(allocator::malloc_or_wait(scores.nbytes())); + scores.set_data(allocator::malloc(scores.nbytes())); copies.push_back(scores); array pointers({B, T, num_states}, uint8, nullptr, {}); - pointers.set_data(allocator::malloc_or_wait(pointers.nbytes())); + pointers.set_data(allocator::malloc(pointers.nbytes())); copies.push_back(pointers); array start({B}, uint32, nullptr, {}); - start.set_data(allocator::malloc_or_wait(start.nbytes())); + start.set_data(allocator::malloc(start.nbytes())); copies.push_back(start); array rolled({B, T}, uint16, nullptr, {}); - rolled.set_data(allocator::malloc_or_wait(rolled.nbytes())); + rolled.set_data(allocator::malloc(rolled.nbytes())); copies.push_back(rolled); viterbi(w, scores, pointers, start, out, false, s);