2024-03-19 11:12:25 +08:00
|
|
|
// Copyright © 2023-2024 Apple Inc.
|
2023-12-01 03:12:53 +08:00
|
|
|
|
2023-11-30 02:30:41 +08:00
|
|
|
#include <numeric>
|
|
|
|
#include <sstream>
|
|
|
|
|
|
|
|
#include "python/src/indexing.h"
|
|
|
|
|
|
|
|
#include "mlx/ops.h"
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
bool is_none_slice(const nb::slice& in_slice) {
|
2023-11-30 02:30:41 +08:00
|
|
|
return (
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::getattr(in_slice, "start").is_none() &&
|
|
|
|
nb::getattr(in_slice, "stop").is_none() &&
|
|
|
|
nb::getattr(in_slice, "step").is_none());
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
int get_slice_int(nb::object obj, int default_val) {
|
2023-11-30 02:30:41 +08:00
|
|
|
if (!obj.is_none()) {
|
2024-03-19 11:12:25 +08:00
|
|
|
if (!nb::isinstance<nb::int_>(obj)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
throw std::invalid_argument("Slice indices must be integers or None.");
|
|
|
|
}
|
2024-03-19 11:12:25 +08:00
|
|
|
return nb::cast<int>(nb::cast<nb::int_>(obj));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
return default_val;
|
|
|
|
}
|
|
|
|
|
|
|
|
void get_slice_params(
|
|
|
|
int& starts,
|
|
|
|
int& ends,
|
|
|
|
int& strides,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::slice& in_slice,
|
2023-11-30 02:30:41 +08:00
|
|
|
int axis_size) {
|
|
|
|
// Following numpy's convention
|
|
|
|
// Assume n is the number of elements in the dimension being sliced.
|
|
|
|
// Then, if i is not given it defaults to 0 for k > 0 and n - 1 for
|
|
|
|
// k < 0 . If j is not given it defaults to n for k > 0 and -n-1 for
|
|
|
|
// k < 0 . If k is not given it defaults to 1
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
strides = get_slice_int(nb::getattr(in_slice, "step"), 1);
|
2023-11-30 02:30:41 +08:00
|
|
|
starts = get_slice_int(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::getattr(in_slice, "start"), strides < 0 ? axis_size - 1 : 0);
|
2023-11-30 02:30:41 +08:00
|
|
|
ends = get_slice_int(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::getattr(in_slice, "stop"), strides < 0 ? -axis_size - 1 : axis_size);
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
array get_int_index(nb::object idx, int axis_size) {
|
|
|
|
int idx_ = nb::cast<int>(idx);
|
2023-11-30 02:30:41 +08:00
|
|
|
idx_ = (idx_ < 0) ? idx_ + axis_size : idx_;
|
|
|
|
|
|
|
|
return array(idx_, uint32);
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
bool is_valid_index_type(const nb::object& obj) {
|
|
|
|
return nb::isinstance<nb::slice>(obj) || nb::isinstance<nb::int_>(obj) ||
|
|
|
|
nb::isinstance<array>(obj) || obj.is_none() || nb::ellipsis().is(obj);
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
array mlx_get_item_slice(const array& src, const nb::slice& in_slice) {
|
2023-11-30 02:30:41 +08:00
|
|
|
// Check input and raise error if 0 dim for parity with np
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Return a copy of the array if none slice is request
|
|
|
|
if (is_none_slice(in_slice)) {
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<int> starts(src.ndim(), 0);
|
|
|
|
std::vector<int> ends = src.shape();
|
|
|
|
std::vector<int> strides(src.ndim(), 1);
|
|
|
|
|
|
|
|
// Check and update slice params
|
|
|
|
get_slice_params(starts[0], ends[0], strides[0], in_slice, ends[0]);
|
|
|
|
return slice(src, starts, ends, strides);
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_get_item_array(const array& src, const array& indices) {
|
|
|
|
// Check input and raise error if 0 dim for parity with np
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (indices.dtype() == bool_) {
|
|
|
|
throw std::invalid_argument("boolean indices are not yet supported");
|
|
|
|
}
|
|
|
|
|
|
|
|
// If only one input array is mentioned, we set axis=0 in take
|
|
|
|
// for parity with np
|
|
|
|
return take(src, indices, 0);
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
array mlx_get_item_int(const array& src, const nb::int_& idx) {
|
2023-11-30 02:30:41 +08:00
|
|
|
// Check input and raise error if 0 dim for parity with np
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
// If only one input idx is mentioned, we set axis=0 in take
|
|
|
|
// for parity with np
|
|
|
|
return take(src, get_int_index(idx, src.shape(0)), 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_gather_nd(
|
|
|
|
array src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const std::vector<nb::object>& indices,
|
2023-11-30 02:30:41 +08:00
|
|
|
bool gather_first,
|
|
|
|
int& max_dims) {
|
|
|
|
max_dims = 0;
|
|
|
|
std::vector<array> gather_indices;
|
|
|
|
std::vector<bool> is_slice(indices.size(), false);
|
|
|
|
int num_slices = 0;
|
|
|
|
// gather all the arrays
|
|
|
|
for (int i = 0; i < indices.size(); i++) {
|
|
|
|
auto& idx = indices[i];
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<nb::slice>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
int start, end, stride;
|
2024-03-19 11:12:25 +08:00
|
|
|
get_slice_params(
|
|
|
|
start, end, stride, nb::cast<nb::slice>(idx), src.shape(i));
|
2023-12-21 02:44:01 +08:00
|
|
|
|
|
|
|
// Handle negative indices
|
|
|
|
start = (start < 0) ? start + src.shape(i) : start;
|
|
|
|
end = (end < 0) ? end + src.shape(i) : end;
|
|
|
|
|
2023-11-30 02:30:41 +08:00
|
|
|
gather_indices.push_back(arange(start, end, stride, uint32));
|
|
|
|
num_slices++;
|
|
|
|
is_slice[i] = true;
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<nb::int_>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
gather_indices.push_back(get_int_index(idx, src.shape(i)));
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<array>(idx)) {
|
|
|
|
auto arr = nb::cast<array>(idx);
|
2023-11-30 02:30:41 +08:00
|
|
|
max_dims = std::max(static_cast<int>(arr.ndim()), max_dims);
|
|
|
|
gather_indices.push_back(arr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// reshape them so that the int/array indices are first
|
|
|
|
if (gather_first) {
|
|
|
|
int slice_index = 0;
|
|
|
|
for (int i = 0; i < gather_indices.size(); i++) {
|
|
|
|
if (is_slice[i]) {
|
|
|
|
std::vector<int> index_shape(max_dims + num_slices, 1);
|
|
|
|
index_shape[max_dims + slice_index] = gather_indices[i].shape(0);
|
|
|
|
gather_indices[i] = reshape(gather_indices[i], index_shape);
|
|
|
|
slice_index++;
|
|
|
|
} else {
|
|
|
|
std::vector<int> index_shape = gather_indices[i].shape();
|
|
|
|
index_shape.insert(index_shape.end(), num_slices, 1);
|
|
|
|
gather_indices[i] = reshape(gather_indices[i], index_shape);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// reshape them so that the int/array indices are last
|
|
|
|
for (int i = 0; i < gather_indices.size(); i++) {
|
|
|
|
if (i < num_slices) {
|
|
|
|
std::vector<int> index_shape(max_dims + num_slices, 1);
|
|
|
|
index_shape[i] = gather_indices[i].shape(0);
|
|
|
|
gather_indices[i] = reshape(gather_indices[i], index_shape);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Do the gather
|
|
|
|
std::vector<int> axes(indices.size());
|
|
|
|
std::iota(axes.begin(), axes.end(), 0);
|
|
|
|
std::vector<int> slice_sizes = src.shape();
|
|
|
|
std::fill(slice_sizes.begin(), slice_sizes.begin() + indices.size(), 1);
|
|
|
|
src = gather(src, gather_indices, axes, slice_sizes);
|
|
|
|
|
|
|
|
// Squeeze the dims
|
|
|
|
std::vector<int> out_shape;
|
|
|
|
out_shape.insert(
|
|
|
|
out_shape.end(),
|
|
|
|
src.shape().begin(),
|
|
|
|
src.shape().begin() + max_dims + num_slices);
|
|
|
|
out_shape.insert(
|
|
|
|
out_shape.end(),
|
|
|
|
src.shape().begin() + max_dims + num_slices + indices.size(),
|
|
|
|
src.shape().end());
|
|
|
|
src = reshape(src, out_shape);
|
|
|
|
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
array mlx_get_item_nd(array src, const nb::tuple& entries) {
|
2023-11-30 02:30:41 +08:00
|
|
|
// No indices make this a noop
|
|
|
|
if (entries.size() == 0) {
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
|
|
|
|
// The plan is as follows:
|
|
|
|
// 1. Replace the ellipsis with a series of slice(None)
|
|
|
|
// 2. Loop over the indices and calculate the gather indices
|
|
|
|
// 3. Calculate the remaining slices and reshapes
|
|
|
|
|
|
|
|
// Ellipsis handling
|
2024-03-19 11:12:25 +08:00
|
|
|
std::vector<nb::object> indices;
|
2023-11-30 02:30:41 +08:00
|
|
|
{
|
|
|
|
int non_none_indices_before = 0;
|
|
|
|
int non_none_indices_after = 0;
|
2024-03-19 11:12:25 +08:00
|
|
|
std::vector<nb::object> r_indices;
|
2023-11-30 02:30:41 +08:00
|
|
|
int i = 0;
|
|
|
|
for (; i < entries.size(); i++) {
|
|
|
|
auto idx = entries[i];
|
|
|
|
if (!is_valid_index_type(idx)) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"Cannot index mlx array using the given type yet");
|
|
|
|
}
|
2024-03-19 11:12:25 +08:00
|
|
|
if (!nb::ellipsis().is(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
indices.push_back(idx);
|
|
|
|
non_none_indices_before += !idx.is_none();
|
|
|
|
} else {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
for (int j = entries.size() - 1; j > i; j--) {
|
|
|
|
auto idx = entries[j];
|
|
|
|
if (!is_valid_index_type(idx)) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"Cannot index mlx array using the given type yet");
|
|
|
|
}
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::ellipsis().is(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
throw std::invalid_argument(
|
|
|
|
"An index can only have a single ellipsis (...)");
|
|
|
|
}
|
|
|
|
r_indices.push_back(idx);
|
|
|
|
non_none_indices_after += !idx.is_none();
|
|
|
|
}
|
|
|
|
for (int axis = non_none_indices_before;
|
|
|
|
axis < src.ndim() - non_none_indices_after;
|
|
|
|
axis++) {
|
2024-03-19 11:12:25 +08:00
|
|
|
indices.push_back(nb::slice(0, src.shape(axis), 1));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
indices.insert(indices.end(), r_indices.rbegin(), r_indices.rend());
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check for the number of indices passed
|
|
|
|
{
|
|
|
|
int cnt = src.ndim();
|
|
|
|
for (auto& idx : indices) {
|
|
|
|
if (!idx.is_none()) {
|
|
|
|
cnt--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (cnt < 0) {
|
|
|
|
std::ostringstream msg;
|
|
|
|
msg << "Too many indices for array with " << src.ndim() << "dimensions.";
|
|
|
|
throw std::invalid_argument(msg.str());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Gather handling
|
|
|
|
//
|
|
|
|
// Check whether we have arrays or integer indices and delegate to gather_nd
|
|
|
|
// after removing the slices at the end and all Nones.
|
2024-03-19 11:12:25 +08:00
|
|
|
std::vector<nb::object> remaining_indices;
|
2023-11-30 02:30:41 +08:00
|
|
|
bool have_array = false;
|
|
|
|
{
|
|
|
|
// First check whether the results of gather are going to be 1st or
|
|
|
|
// normally in between.
|
|
|
|
bool have_non_array = false;
|
|
|
|
bool gather_first = false;
|
|
|
|
for (auto& idx : indices) {
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<array>(idx) || nb::isinstance<nb::int_>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
if (have_array && have_non_array) {
|
|
|
|
gather_first = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
have_array = true;
|
|
|
|
} else {
|
|
|
|
have_non_array |= have_array;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (have_array) {
|
|
|
|
int last_array;
|
|
|
|
// Then find the last array
|
|
|
|
for (last_array = indices.size() - 1; last_array >= 0; last_array--) {
|
|
|
|
auto& idx = indices[last_array];
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<array>(idx) || nb::isinstance<nb::int_>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
std::vector<nb::object> gather_indices;
|
2023-11-30 02:30:41 +08:00
|
|
|
for (int i = 0; i <= last_array; i++) {
|
|
|
|
auto& idx = indices[i];
|
|
|
|
if (!idx.is_none()) {
|
|
|
|
gather_indices.push_back(idx);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
int max_dims;
|
|
|
|
src = mlx_gather_nd(src, gather_indices, gather_first, max_dims);
|
|
|
|
|
|
|
|
// Reassemble the indices for the slicing or reshaping if there are any
|
|
|
|
if (gather_first) {
|
|
|
|
for (int i = 0; i < max_dims; i++) {
|
|
|
|
remaining_indices.push_back(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::slice(nb::none(), nb::none(), nb::none()));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
for (int i = 0; i < last_array; i++) {
|
|
|
|
auto& idx = indices[i];
|
|
|
|
if (idx.is_none()) {
|
|
|
|
remaining_indices.push_back(indices[i]);
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<nb::slice>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
remaining_indices.push_back(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::slice(nb::none(), nb::none(), nb::none()));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
for (int i = last_array + 1; i < indices.size(); i++) {
|
|
|
|
remaining_indices.push_back(indices[i]);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
for (int i = 0; i < indices.size(); i++) {
|
|
|
|
auto& idx = indices[i];
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<array>(idx) || nb::isinstance<nb::int_>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
break;
|
|
|
|
} else if (idx.is_none()) {
|
|
|
|
remaining_indices.push_back(idx);
|
|
|
|
} else {
|
|
|
|
remaining_indices.push_back(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::slice(nb::none(), nb::none(), nb::none()));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
for (int i = 0; i < max_dims; i++) {
|
|
|
|
remaining_indices.push_back(
|
2024-03-19 11:12:25 +08:00
|
|
|
nb::slice(nb::none(), nb::none(), nb::none()));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
for (int i = last_array + 1; i < indices.size(); i++) {
|
|
|
|
remaining_indices.push_back(indices[i]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (have_array && remaining_indices.empty()) {
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
if (remaining_indices.empty()) {
|
|
|
|
remaining_indices = indices;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Slice handling
|
|
|
|
{
|
|
|
|
std::vector<int> starts(src.ndim(), 0);
|
|
|
|
std::vector<int> ends = src.shape();
|
|
|
|
std::vector<int> strides(src.ndim(), 1);
|
|
|
|
int axis = 0;
|
|
|
|
for (auto& idx : remaining_indices) {
|
|
|
|
if (!idx.is_none()) {
|
|
|
|
get_slice_params(
|
2024-03-19 11:12:25 +08:00
|
|
|
starts[axis],
|
|
|
|
ends[axis],
|
|
|
|
strides[axis],
|
|
|
|
nb::cast<nb::slice>(idx),
|
|
|
|
ends[axis]);
|
2023-11-30 02:30:41 +08:00
|
|
|
axis++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
src = slice(src, starts, ends, strides);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Unsqueeze handling
|
|
|
|
if (remaining_indices.size() > src.ndim()) {
|
|
|
|
std::vector<int> out_shape;
|
|
|
|
int axis = 0;
|
|
|
|
for (auto& idx : remaining_indices) {
|
|
|
|
if (idx.is_none()) {
|
|
|
|
out_shape.push_back(1);
|
|
|
|
} else {
|
|
|
|
out_shape.push_back(src.shape(axis++));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
src = reshape(src, out_shape);
|
|
|
|
}
|
|
|
|
|
|
|
|
return src;
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
array mlx_get_item(const array& src, const nb::object& obj) {
|
|
|
|
if (nb::isinstance<nb::slice>(obj)) {
|
|
|
|
return mlx_get_item_slice(src, nb::cast<nb::slice>(obj));
|
|
|
|
} else if (nb::isinstance<array>(obj)) {
|
|
|
|
return mlx_get_item_array(src, nb::cast<array>(obj));
|
|
|
|
} else if (nb::isinstance<nb::int_>(obj)) {
|
|
|
|
return mlx_get_item_int(src, nb::cast<nb::int_>(obj));
|
|
|
|
} else if (nb::isinstance<nb::tuple>(obj)) {
|
|
|
|
return mlx_get_item_nd(src, nb::cast<nb::tuple>(obj));
|
|
|
|
} else if (nb::isinstance<nb::ellipsis>(obj)) {
|
|
|
|
return src;
|
2023-11-30 02:30:41 +08:00
|
|
|
} else if (obj.is_none()) {
|
|
|
|
std::vector<int> s(1, 1);
|
|
|
|
s.insert(s.end(), src.shape().begin(), src.shape().end());
|
|
|
|
return reshape(src, s);
|
|
|
|
}
|
|
|
|
throw std::invalid_argument("Cannot index mlx array using the given type.");
|
|
|
|
}
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
std::tuple<std::vector<array>, array, std::vector<int>> mlx_scatter_args_int(
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::int_& idx,
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& update) {
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Remove any leading singleton dimensions from the update
|
|
|
|
// and then broadcast update to shape of src[0, ...]
|
|
|
|
int s = 0;
|
|
|
|
for (; s < update.ndim() && update.shape(s) == 1; s++)
|
|
|
|
;
|
|
|
|
auto up_shape =
|
|
|
|
std::vector<int>(update.shape().begin() + s, update.shape().end());
|
|
|
|
auto shape = src.shape();
|
|
|
|
shape[0] = 1;
|
2024-01-10 05:36:51 +08:00
|
|
|
|
|
|
|
return {
|
|
|
|
{get_int_index(idx, src.shape(0))},
|
2023-11-30 02:30:41 +08:00
|
|
|
broadcast_to(reshape(update, up_shape), shape),
|
2024-01-10 05:36:51 +08:00
|
|
|
{0}};
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
std::tuple<std::vector<array>, array, std::vector<int>> mlx_scatter_args_array(
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& src,
|
|
|
|
const array& indices,
|
|
|
|
const array& update) {
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Remove any leading singleton dimensions from the update
|
|
|
|
int s = 0;
|
|
|
|
for (; s < update.ndim() && update.shape(s) == 1; s++)
|
|
|
|
;
|
|
|
|
auto up_shape =
|
|
|
|
std::vector<int>(update.shape().begin() + s, update.shape().end());
|
|
|
|
auto up = reshape(update, up_shape);
|
|
|
|
|
|
|
|
// The update shape must broadcast with indices.shape + [1] + src.shape[1:]
|
|
|
|
up_shape = indices.shape();
|
|
|
|
up_shape.insert(up_shape.end(), src.shape().begin() + 1, src.shape().end());
|
|
|
|
up = broadcast_to(up, up_shape);
|
|
|
|
up_shape.insert(up_shape.begin() + indices.ndim(), 1);
|
|
|
|
up = reshape(up, up_shape);
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
return {{indices}, up, {0}};
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
std::tuple<std::vector<array>, array, std::vector<int>> mlx_scatter_args_slice(
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::slice& in_slice,
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& update) {
|
|
|
|
// Check input and raise error if 0 dim for parity with np
|
|
|
|
if (src.ndim() == 0) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"too many indices for array: array is 0-dimensional");
|
|
|
|
}
|
|
|
|
|
|
|
|
// If none slice is requested broadcast the update
|
|
|
|
// to the src size and return it.
|
|
|
|
if (is_none_slice(in_slice)) {
|
|
|
|
int s = 0;
|
|
|
|
for (; s < update.ndim() && update.shape(s) == 1; s++)
|
|
|
|
;
|
|
|
|
auto up_shape =
|
|
|
|
std::vector<int>(update.shape().begin() + s, update.shape().end());
|
2024-01-10 05:36:51 +08:00
|
|
|
return {{}, broadcast_to(reshape(update, up_shape), src.shape()), {}};
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int start = 0;
|
|
|
|
int end = src.shape(0);
|
|
|
|
int stride = 1;
|
|
|
|
|
|
|
|
// Check and update slice params
|
|
|
|
get_slice_params(start, end, stride, in_slice, end);
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
return mlx_scatter_args_array(
|
|
|
|
src, arange(start, end, stride, uint32), update);
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
std::tuple<std::vector<array>, array, std::vector<int>> mlx_scatter_args_nd(
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::tuple& entries,
|
2023-11-30 02:30:41 +08:00
|
|
|
const array& update) {
|
2024-03-19 11:12:25 +08:00
|
|
|
std::vector<nb::object> indices;
|
2023-11-30 02:30:41 +08:00
|
|
|
int non_none_indices = 0;
|
|
|
|
|
|
|
|
// Expand ellipses into a series of ':' slices
|
|
|
|
{
|
|
|
|
int non_none_indices_before = 0;
|
|
|
|
int non_none_indices_after = 0;
|
|
|
|
bool has_ellipsis = false;
|
|
|
|
int indices_before = 0;
|
|
|
|
for (int i = 0; i < entries.size(); ++i) {
|
|
|
|
auto idx = entries[i];
|
|
|
|
if (!is_valid_index_type(idx)) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"Cannot index mlx array using the given type yet");
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (!nb::ellipsis().is(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
if (!has_ellipsis) {
|
|
|
|
indices_before++;
|
|
|
|
non_none_indices_before += !idx.is_none();
|
|
|
|
} else {
|
|
|
|
non_none_indices_after += !idx.is_none();
|
|
|
|
}
|
|
|
|
indices.push_back(idx);
|
|
|
|
} else if (has_ellipsis) {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"An index can only have a single ellipsis (...)");
|
|
|
|
} else {
|
|
|
|
has_ellipsis = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (has_ellipsis) {
|
|
|
|
for (int axis = non_none_indices_before;
|
|
|
|
axis < src.ndim() - non_none_indices_after;
|
|
|
|
axis++) {
|
|
|
|
indices.insert(
|
2024-03-19 11:12:25 +08:00
|
|
|
indices.begin() + indices_before, nb::slice(0, src.shape(axis), 1));
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
non_none_indices = src.ndim();
|
|
|
|
} else {
|
|
|
|
non_none_indices = non_none_indices_before + non_none_indices_after;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (non_none_indices > src.ndim()) {
|
|
|
|
std::ostringstream msg;
|
|
|
|
msg << "Too many indices for array with " << src.ndim() << "dimensions.";
|
|
|
|
throw std::invalid_argument(msg.str());
|
|
|
|
}
|
|
|
|
|
|
|
|
// Remove leading singletons dimensions from the update
|
|
|
|
int s = 0;
|
|
|
|
for (; s < update.ndim() && update.shape(s) == 1; s++) {
|
|
|
|
};
|
|
|
|
auto up_shape =
|
|
|
|
std::vector<int>(update.shape().begin() + s, update.shape().end());
|
|
|
|
auto up = reshape(update, up_shape);
|
|
|
|
|
|
|
|
// If no non-None indices return the broadcasted update
|
|
|
|
if (non_none_indices == 0) {
|
2024-01-10 05:36:51 +08:00
|
|
|
return {{}, broadcast_to(up, src.shape()), {}};
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
unsigned long max_dim = 0;
|
|
|
|
bool arrays_first = false;
|
|
|
|
int num_slices = 0;
|
|
|
|
int num_arrays = 0;
|
|
|
|
{
|
|
|
|
bool have_array = false;
|
|
|
|
bool have_non_array = false;
|
|
|
|
for (auto& idx : indices) {
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<nb::slice>(idx) || idx.is_none()) {
|
2023-11-30 02:30:41 +08:00
|
|
|
have_non_array = have_array;
|
|
|
|
num_slices++;
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<array>(idx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
have_array = true;
|
|
|
|
if (have_array && have_non_array) {
|
|
|
|
arrays_first = true;
|
|
|
|
}
|
2024-03-19 11:12:25 +08:00
|
|
|
max_dim = std::max(nb::cast<array>(idx).ndim(), max_dim);
|
2023-11-30 02:30:41 +08:00
|
|
|
num_arrays++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<array> arr_indices;
|
|
|
|
int slice_num = 0;
|
|
|
|
int array_num = 0;
|
|
|
|
int ax = 0;
|
|
|
|
for (int i = 0; i < indices.size(); ++i) {
|
|
|
|
auto& pyidx = indices[i];
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<nb::slice>(pyidx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
int start, end, stride;
|
2023-12-16 22:44:47 +08:00
|
|
|
auto axis_size = src.shape(ax++);
|
2024-03-19 11:12:25 +08:00
|
|
|
get_slice_params(
|
|
|
|
start, end, stride, nb::cast<nb::slice>(pyidx), axis_size);
|
2023-12-16 22:44:47 +08:00
|
|
|
|
|
|
|
// Handle negative indices
|
|
|
|
start = (start < 0) ? start + axis_size : start;
|
|
|
|
end = (end < 0) ? end + axis_size : end;
|
|
|
|
|
2023-11-30 02:30:41 +08:00
|
|
|
auto idx = arange(start, end, stride, uint32);
|
|
|
|
std::vector<int> idx_shape(max_dim + num_slices, 1);
|
|
|
|
auto loc = slice_num + (arrays_first ? max_dim : 0);
|
|
|
|
slice_num++;
|
|
|
|
idx_shape[loc] = idx.size();
|
|
|
|
arr_indices.push_back(reshape(idx, idx_shape));
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<nb::int_>(pyidx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
arr_indices.push_back(get_int_index(pyidx, src.shape(ax++)));
|
|
|
|
} else if (pyidx.is_none()) {
|
|
|
|
slice_num++;
|
2024-03-19 11:12:25 +08:00
|
|
|
} else if (nb::isinstance<array>(pyidx)) {
|
2023-11-30 02:30:41 +08:00
|
|
|
ax++;
|
2024-03-19 11:12:25 +08:00
|
|
|
auto idx = nb::cast<array>(pyidx);
|
2023-11-30 02:30:41 +08:00
|
|
|
std::vector<int> idx_shape;
|
|
|
|
if (!arrays_first) {
|
|
|
|
idx_shape.insert(idx_shape.end(), slice_num, 1);
|
|
|
|
}
|
|
|
|
idx_shape.insert(idx_shape.end(), max_dim - idx.ndim(), 1);
|
|
|
|
idx_shape.insert(idx_shape.end(), idx.shape().begin(), idx.shape().end());
|
|
|
|
idx_shape.insert(
|
|
|
|
idx_shape.end(), num_slices - (arrays_first ? 0 : slice_num), 1);
|
|
|
|
arr_indices.push_back(reshape(idx, idx_shape));
|
|
|
|
if (!arrays_first && ++array_num == num_arrays) {
|
|
|
|
slice_num += max_dim;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
throw std::invalid_argument(
|
|
|
|
"Cannot index mlx array using the given type yet");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
arr_indices = broadcast_arrays(arr_indices);
|
|
|
|
up_shape = arr_indices[0].shape();
|
|
|
|
up_shape.insert(
|
|
|
|
up_shape.end(),
|
|
|
|
src.shape().begin() + non_none_indices,
|
|
|
|
src.shape().end());
|
|
|
|
up = broadcast_to(up, up_shape);
|
|
|
|
up_shape.insert(
|
|
|
|
up_shape.begin() + arr_indices[0].ndim(), non_none_indices, 1);
|
|
|
|
up = reshape(up, up_shape);
|
|
|
|
|
|
|
|
std::vector<int> axes(arr_indices.size(), 0);
|
|
|
|
std::iota(axes.begin(), axes.end(), 0);
|
2024-01-10 05:36:51 +08:00
|
|
|
|
|
|
|
return {arr_indices, up, axes};
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|
|
|
|
|
2024-01-10 05:36:51 +08:00
|
|
|
std::tuple<std::vector<array>, array, std::vector<int>>
|
|
|
|
mlx_compute_scatter_args(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
2023-11-30 02:30:41 +08:00
|
|
|
auto vals = to_array(v, src.dtype());
|
2024-03-19 11:12:25 +08:00
|
|
|
if (nb::isinstance<nb::slice>(obj)) {
|
|
|
|
return mlx_scatter_args_slice(src, nb::cast<nb::slice>(obj), vals);
|
|
|
|
} else if (nb::isinstance<array>(obj)) {
|
|
|
|
return mlx_scatter_args_array(src, nb::cast<array>(obj), vals);
|
|
|
|
} else if (nb::isinstance<nb::int_>(obj)) {
|
|
|
|
return mlx_scatter_args_int(src, nb::cast<nb::int_>(obj), vals);
|
|
|
|
} else if (nb::isinstance<nb::tuple>(obj)) {
|
|
|
|
return mlx_scatter_args_nd(src, nb::cast<nb::tuple>(obj), vals);
|
2024-01-10 05:36:51 +08:00
|
|
|
} else if (obj.is_none()) {
|
|
|
|
return {{}, broadcast_to(vals, src.shape()), {}};
|
|
|
|
}
|
|
|
|
throw std::invalid_argument("Cannot index mlx array using the given type.");
|
|
|
|
}
|
|
|
|
|
2024-03-19 11:12:25 +08:00
|
|
|
void mlx_set_item(array& src, const nb::object& obj, const ScalarOrArray& v) {
|
2024-01-10 05:36:51 +08:00
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
auto out = scatter(src, indices, updates, axes);
|
|
|
|
src.overwrite_descriptor(out);
|
|
|
|
} else {
|
|
|
|
src.overwrite_descriptor(updates);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_add_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_add(src, indices, updates, axes);
|
|
|
|
} else {
|
|
|
|
return src + updates;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_subtract_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_add(src, indices, -updates, axes);
|
|
|
|
} else {
|
|
|
|
return src - updates;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_multiply_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_prod(src, indices, updates, axes);
|
|
|
|
} else {
|
|
|
|
return src * updates;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_divide_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_prod(src, indices, reciprocal(updates), axes);
|
|
|
|
} else {
|
|
|
|
return src / updates;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_maximum_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_max(src, indices, updates, axes);
|
|
|
|
} else {
|
|
|
|
return maximum(src, updates);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
array mlx_minimum_item(
|
|
|
|
const array& src,
|
2024-03-19 11:12:25 +08:00
|
|
|
const nb::object& obj,
|
2024-01-10 05:36:51 +08:00
|
|
|
const ScalarOrArray& v) {
|
|
|
|
auto [indices, updates, axes] = mlx_compute_scatter_args(src, obj, v);
|
|
|
|
if (indices.size() > 0) {
|
|
|
|
return scatter_min(src, indices, updates, axes);
|
|
|
|
} else {
|
|
|
|
return minimum(src, updates);
|
|
|
|
}
|
2023-11-30 02:30:41 +08:00
|
|
|
}
|