[CUDA] Matmul utils initial commit (#2441)

This commit is contained in:
Angelos Katharopoulos
2025-08-01 14:22:25 -07:00
committed by GitHub
parent 86258f292f
commit be9bc96da4
32 changed files with 856 additions and 14 deletions

View File

@@ -130,6 +130,7 @@ void ternary_op_gpu_inplace(
cu::ternary_g_nd<Op, DType, IdxT, dims_constant()>,
num_blocks,
block_dims,
0,
a.data<bool>(),
b.data<DType>(),
c.data<DType>(),
@@ -146,6 +147,7 @@ void ternary_op_gpu_inplace(
cu::ternary_g<Op, DType, IdxT>,
num_blocks,
block_dims,
0,
a.data<bool>(),
b.data<DType>(),
c.data<DType>(),
@@ -168,6 +170,7 @@ void ternary_op_gpu_inplace(
cu::ternary_v<Op, DType, IdxT, N_READS>,
num_blocks,
block_dims,
0,
a.data<bool>(),
b.data<DType>(),
c.data<DType>(),