Fix to use the C++ API

2025-12-16 01:49:05 +08:00 · 2025-04-20 12:55:58 +09:00
parent 876c1986e4
commit a7a96b0ad6
3 changed files with 85 additions and 78 deletions
--- a/python/mlx/utils.py
+++ b/python/mlx/utils.py
@@ -289,64 +289,3 @@ def tree_merge(tree_a, tree_b, merge_fn=None):
                )
            )
        return merge_fn(tree_a, tree_b)
 def broadcast_shapes(*shapes):
    """Broadcast shapes to the same size.

    Uses the same broadcasting rules as NumPy: shapes are aligned on their
    trailing axes, and two aligned axes are compatible when they are equal
    or when one of them is 1. Missing leading axes behave like axes of
    size 1.

    Args:
        *shapes: The shapes to be broadcast against each other.
            Each shape should be a tuple or list of integers.

    Returns:
        A tuple of integers representing the broadcasted shape. A tuple is
        returned even when a single shape is passed as a list.

    Raises:
        ValueError: If no shapes are provided, or if the shapes cannot be
            broadcast according to broadcasting rules.

    Examples:
        >>> broadcast_shapes((1, 2, 3), (3,))
        (1, 2, 3)
        >>> broadcast_shapes((1, 2, 3), (4, 1, 3))
        (4, 2, 3)
        >>> broadcast_shapes((5, 1, 3), (1, 4, 3))
        (5, 4, 3)
    """
    if not shapes:
        raise ValueError("No shapes provided")

    # Normalize to a tuple up front so the return type does not depend on
    # how many shapes were passed or on whether they were lists.
    result = tuple(shapes[0])
    for shape in shapes[1:]:
        ndim = max(len(result), len(shape))
        # Left-pad the shorter shape with 1s so both have the same rank;
        # an axis of size 1 broadcasts against anything.
        lhs = (1,) * (ndim - len(result)) + result
        rhs = (1,) * (ndim - len(shape)) + tuple(shape)

        out_shape = []
        for a, b in zip(lhs, rhs):
            if a == b or b == 1:
                out_shape.append(a)
            elif a == 1:
                out_shape.append(b)
            else:
                raise ValueError(
                    f"Shapes {result} and {shape} cannot be broadcast together"
                )
        result = tuple(out_shape)
    return result
--- a/python/src/ops.cpp
+++ b/python/src/ops.cpp
@@ -5189,4 +5189,72 @@ void init_ops(nb::module_& m) {
      Returns:
        array: The row or col contiguous output.
    )pbdoc");
  // Python binding `broadcast_shapes(*shapes)`: converts each positional
  // argument (a tuple or list of ints) to an mx::Shape, folds them pairwise
  // through mx::broadcast_shapes, and returns the result as a Python tuple.
  m.def(
      "broadcast_shapes",
      [](const nb::args& shapes) {
        // At least one shape is required. nanobind's default exception
        // translation surfaces std::invalid_argument as ValueError.
        if (shapes.size() == 0) {
          throw std::invalid_argument(
              "broadcast_shapes expects a sequence of shapes");
        }

        // Copies every dimension of a Python tuple/list into a C++ shape.
        // Shared by both accepted container types to avoid duplicated loops.
        auto to_shape = [](const auto& seq) {
          mx::Shape shape;
          for (size_t j = 0; j < seq.size(); ++j) {
            shape.push_back(nb::cast<int>(seq[j]));
          }
          return shape;
        };

        // Convert and validate all arguments before broadcasting, so a
        // wrongly typed argument is reported before any shape mismatch.
        std::vector<mx::Shape> shape_vec;
        shape_vec.reserve(shapes.size());
        for (size_t i = 0; i < shapes.size(); ++i) {
          if (nb::isinstance<nb::tuple>(shapes[i])) {
            shape_vec.push_back(to_shape(nb::cast<nb::tuple>(shapes[i])));
          } else if (nb::isinstance<nb::list>(shapes[i])) {
            shape_vec.push_back(to_shape(nb::cast<nb::list>(shapes[i])));
          } else {
            throw std::invalid_argument(
                "broadcast_shapes expects a sequence of shapes");
          }
        }

        // shape_vec is non-empty here: the empty-args case threw above and
        // every loop iteration either appended a shape or threw.
        mx::Shape result = shape_vec[0];
        for (size_t i = 1; i < shape_vec.size(); ++i) {
          result = mx::broadcast_shapes(result, shape_vec[i]);
        }

        // Re-wrap the converted Python object as a tuple, matching the
        // documented return type.
        return nb::tuple(nb::cast(result));
      },
      nb::sig("def broadcast_shapes(*shapes: Sequence[int]) -> Sequence[int]"),
      R"pbdoc(
        Broadcast shapes.
        Returns the shape that results from broadcasting the supplied array shapes
        against each other.
        Args:
            *shapes (Sequence[int]): The shapes to broadcast.
        Returns:
            tuple: The broadcasted shape.
        Raises:
            ValueError: If the shapes cannot be broadcast.
        Example:
            >>> mx.broadcast_shapes((1,), (3, 1))
            (3, 1)
            >>> mx.broadcast_shapes((6, 7), (5, 6, 1), (7,))
            (5, 6, 7)
            >>> mx.broadcast_shapes((5, 1, 4), (1, 3, 1))
            (5, 3, 4)
      )pbdoc");
 }
--- a/python/tests/test_broadcast.py
+++ b/python/tests/test_broadcast.py
@@ -1,44 +1,44 @@
 # Copyright © 2025 Apple Inc.
-import mlx.utils
+import mlx.core
 import mlx_tests
 class TestBroadcast(mlx_tests.MLXTestCase):
    def test_broadcast_shapes(self):
        # Basic broadcasting
-        self.assertEqual(mlx.utils.broadcast_shapes((1, 2, 3), (3,)), (1, 2, 3))
+        self.assertEqual(mlx.core.broadcast_shapes((1, 2, 3), (3,)), (1, 2, 3))
-        self.assertEqual(mlx.utils.broadcast_shapes((4, 1, 6), (5, 6)), (4, 5, 6))
+        self.assertEqual(mlx.core.broadcast_shapes((4, 1, 6), (5, 6)), (4, 5, 6))
-        self.assertEqual(mlx.utils.broadcast_shapes((5, 1, 4), (1, 3, 4)), (5, 3, 4))
+        self.assertEqual(mlx.core.broadcast_shapes((5, 1, 4), (1, 3, 4)), (5, 3, 4))
        # Multiple arguments
-        self.assertEqual(mlx.utils.broadcast_shapes((1, 1), (1, 8), (7, 1)), (7, 8))
+        self.assertEqual(mlx.core.broadcast_shapes((1, 1), (1, 8), (7, 1)), (7, 8))
        self.assertEqual(
-            mlx.utils.broadcast_shapes((6, 1, 5), (1, 7, 1), (6, 7, 5)), (6, 7, 5)
+            mlx.core.broadcast_shapes((6, 1, 5), (1, 7, 1), (6, 7, 5)), (6, 7, 5)
        )
        # Same shapes
-        self.assertEqual(mlx.utils.broadcast_shapes((3, 4, 5), (3, 4, 5)), (3, 4, 5))
+        self.assertEqual(mlx.core.broadcast_shapes((3, 4, 5), (3, 4, 5)), (3, 4, 5))
        # Single argument
-        self.assertEqual(mlx.utils.broadcast_shapes((2, 3)), (2, 3))
+        self.assertEqual(mlx.core.broadcast_shapes((2, 3)), (2, 3))
        # Empty shapes
-        self.assertEqual(mlx.utils.broadcast_shapes((), ()), ())
+        self.assertEqual(mlx.core.broadcast_shapes((), ()), ())
-        self.assertEqual(mlx.utils.broadcast_shapes((), (1,)), (1,))
+        self.assertEqual(mlx.core.broadcast_shapes((), (1,)), (1,))
-        self.assertEqual(mlx.utils.broadcast_shapes((1,), ()), (1,))
+        self.assertEqual(mlx.core.broadcast_shapes((1,), ()), (1,))
        # Broadcasting with zeroes
-        self.assertEqual(mlx.utils.broadcast_shapes((0,), (0,)), (0,))
+        self.assertEqual(mlx.core.broadcast_shapes((0,), (0,)), (0,))
-        self.assertEqual(mlx.utils.broadcast_shapes((1, 0, 5), (3, 1, 5)), (3, 0, 5))
+        self.assertEqual(mlx.core.broadcast_shapes((1, 0, 5), (3, 1, 5)), (3, 0, 5))
-        self.assertEqual(mlx.utils.broadcast_shapes((5, 0), (0, 5, 0)), (0, 5, 0))
+        self.assertEqual(mlx.core.broadcast_shapes((5, 0), (0, 5, 0)), (0, 5, 0))
        # Error cases
        with self.assertRaises(ValueError):
-            mlx.utils.broadcast_shapes((3, 4), (4, 3))
+            mlx.core.broadcast_shapes((3, 4), (4, 3))
        with self.assertRaises(ValueError):
-            mlx.utils.broadcast_shapes((2, 3, 4), (2, 5, 4))
+            mlx.core.broadcast_shapes((2, 3, 4), (2, 5, 4))
        with self.assertRaises(ValueError):
-            mlx.utils.broadcast_shapes()
+            mlx.core.broadcast_shapes()