26 int64_t A_batch_stride,
27 int64_t B_batch_stride,
28 int64_t matrix_stride_out,
29 std::vector<array>& copies);
45 std::vector<array>& copies,
46 Shape batch_shape = {},
void steel_matmul_regular(const Stream &s, metal::Device &d, const array &a, const array &b, array &out, int M, int N, int K, int batch_size_out, int lda, int ldb, int ldd, bool transpose_a, bool transpose_b, Shape batch_shape, Strides batch_strides, int64_t A_batch_stride, int64_t B_batch_stride, int64_t matrix_stride_out, std::vector< array > &copies)
std::vector< ShapeElem > Shape
Definition array.h:21
std::vector< int64_t > Strides
Definition array.h:22
void steel_matmul(const Stream &s, metal::Device &d, const array &a, const array &b, array &out, int M, int N, int K, int batch_size_out, int lda, int ldb, bool transpose_a, bool transpose_b, std::vector< array > &copies, Shape batch_shape={}, Strides A_batch_stride={}, Strides B_batch_stride={})