|
template<typename T , typename out_mask_t , typename op_mask_t , const int BM, const int BN, const int SM, const int SN, const int TM, const int TN, const bool kDoNCBatch> |
void | gemv_masked (const device T *mat, const device T *in_vec, device T *out_vec, const constant int &in_vec_size, const constant int &out_vec_size, const constant int &marix_ld, const constant int &batch_ndim, const constant int *batch_shape, const constant size_t *vector_batch_stride, const constant size_t *matrix_batch_stride, const device out_mask_t *out_mask, const device op_mask_t *mat_mask, const device op_mask_t *vec_mask, const constant int *mask_strides, const constant size_t *mask_batch_strides, uint3 tid, uint3 lid, uint simd_gid, uint simd_lid) |
| Matrix-vector multiplication.
|
|
template<typename T , typename out_mask_t , typename op_mask_t , const int BM, const int BN, const int SM, const int SN, const int TM, const int TN, const bool kDoNCBatch> |
void | gemv_t_masked (const device T *mat, const device T *in_vec, device T *out_vec, const constant int &in_vec_size, const constant int &out_vec_size, const constant int &marix_ld, const constant int &batch_ndim, const constant int *batch_shape, const constant size_t *vector_batch_stride, const constant size_t *matrix_batch_stride, const device out_mask_t *out_mask, const device op_mask_t *mat_mask, const device op_mask_t *vec_mask, const constant int *mask_strides, const constant size_t *mask_batch_strides, uint3 tid, uint3 lid, uint simd_gid, uint simd_lid) |
| Vector-matrix multiplication.
|
|
template<typename T, typename out_mask_t, typename op_mask_t, const int BM, const int BN, const int SM, const int SN, const int TM, const int TN, const bool kDoNCBatch>
void gemv_masked(
    const device T *mat,
    const device T *in_vec,
    device T *out_vec,
    const constant int &in_vec_size,
    const constant int &out_vec_size,
    const constant int &marix_ld,
    const constant int &batch_ndim,
    const constant int *batch_shape,
    const constant size_t *vector_batch_stride,
    const constant size_t *matrix_batch_stride,
    const device out_mask_t *out_mask,
    const device op_mask_t *mat_mask,
    const device op_mask_t *vec_mask,
    const constant int *mask_strides,
    const constant size_t *mask_batch_strides,
    uint3 tid,
    uint3 lid,
    uint simd_gid,
    uint simd_lid)
Matrix-vector multiplication.
template<typename T, typename out_mask_t, typename op_mask_t, const int BM, const int BN, const int SM, const int SN, const int TM, const int TN, const bool kDoNCBatch>
void gemv_t_masked(
    const device T *mat,
    const device T *in_vec,
    device T *out_vec,
    const constant int &in_vec_size,
    const constant int &out_vec_size,
    const constant int &marix_ld,
    const constant int &batch_ndim,
    const constant int *batch_shape,
    const constant size_t *vector_batch_stride,
    const constant size_t *matrix_batch_stride,
    const device out_mask_t *out_mask,
    const device op_mask_t *mat_mask,
    const device op_mask_t *vec_mask,
    const constant int *mask_strides,
    const constant size_t *mask_batch_strides,
    uint3 tid,
    uint3 lid,
    uint simd_gid,
    uint simd_lid)
Vector-matrix multiplication.