<!-- 2024-06-07 11:28:06 +08:00 -->
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "https://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
< html xmlns = "http://www.w3.org/1999/xhtml" lang = "en-US" >
< head >
< meta http-equiv = "Content-Type" content = "text/html;charset=UTF-8" / >
< meta http-equiv = "X-UA-Compatible" content = "IE=11" / >
< meta name = "generator" content = "Doxygen 1.10.0" / >
< meta name = "viewport" content = "width=device-width, initial-scale=1" / >
< title > MLX: mlx/backend/metal/kernels/steel/gemm/kernels/steel_gemm_masked.h File Reference< / title >
< link href = "tabs.css" rel = "stylesheet" type = "text/css" / >
< script type = "text/javascript" src = "jquery.js" > < / script >
< script type = "text/javascript" src = "dynsections.js" > < / script >
< script type = "text/javascript" src = "clipboard.js" > < / script >
< script type = "text/javascript" src = "cookie.js" > < / script >
< link href = "search/search.css" rel = "stylesheet" type = "text/css" / >
< script type = "text/javascript" src = "search/searchdata.js" > < / script >
< script type = "text/javascript" src = "search/search.js" > < / script >
< link href = "doxygen.css" rel = "stylesheet" type = "text/css" / >
< / head >
< body >
< div id = "top" > <!-- do not remove this div, it is closed by doxygen! -->
< div id = "titlearea" >
< table cellspacing = "0" cellpadding = "0" >
< tbody >
< tr id = "projectrow" >
< td id = "projectalign" >
< div id = "projectname" > MLX
< / div >
< / td >
< / tr >
< / tbody >
< / table >
< / div >
<!-- end header part -->
<!-- Generated by Doxygen 1.10.0 -->
< script type = "text/javascript" >
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
/* Create the global `searchBox` object. The mouse/key handlers on the
   MSearchSelectWindow element further down this page call methods on it
   (OnSearchSelectShow / OnSearchSelectHide / OnSearchSelectKey), so the
   name must stay global. SearchBox itself is not defined in this page;
   presumably it comes from search/search.js loaded in the head - confirm. */
var searchBox = new SearchBox("searchBox", "search/",'.html');
/* @license-end */
< / script >
< script type = "text/javascript" src = "menudata.js" > < / script >
< script type = "text/javascript" src = "menu.js" > < / script >
< script type = "text/javascript" >
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
/* Register a callback with `$` that sets up the menu and then the search.
   `$` is presumably jQuery (jquery.js is loaded in the head), in which case
   the callback runs once the DOM is ready - confirm. */
$(function() {
/* initMenu is not defined in this page; presumably provided by menu.js,
   which is loaded just before this script - confirm. */
initMenu('',true,false,'search.php','Search');
/* init_search is registered as a second callback rather than called
   inline; it is not defined in this page either. */
$(function() { init_search(); });
});
/* @license-end */
< / script >
< div id = "main-nav" > < / div >
<!-- window showing the filter options -->
< div id = "MSearchSelectWindow"
onmouseover="return searchBox.OnSearchSelectShow()"
onmouseout="return searchBox.OnSearchSelectHide()"
onkeydown="return searchBox.OnSearchSelectKey(event)">
< / div >
<!-- iframe showing the search results (closed by default) -->
< div id = "MSearchResultsWindow" >
< div id = "MSearchResults" >
< div class = "SRPage" >
< div id = "SRIndex" >
< div id = "SRResults" > < / div >
< div class = "SRStatus" id = "Loading" > Loading...< / div >
< div class = "SRStatus" id = "Searching" > Searching...< / div >
< div class = "SRStatus" id = "NoMatches" > No Matches< / div >
< / div >
< / div >
< / div >
< / div >
< div id = "nav-path" class = "navpath" >
< ul >
< li class = "navelem" > < a class = "el" href = "dir_938ab0ecf10b8b860ff766c820f665fd.html" > mlx< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_1d446c9bd3c99228254c9484e0bc5c06.html" > backend< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_d0c977ea65824390717cdb7efc36c157.html" > metal< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_70a37effa88bcbd6b791977fa1e64356.html" > kernels< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_76215a6c54e2b67053e723fc2395583c.html" > steel< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_6768c99e6145fb9510ccdb40db8ede25.html" > gemm< / a > < / li > < li class = "navelem" > < a class = "el" href = "dir_9c555e3d0f5b8c3fb3a7397c81fd5bf9.html" > kernels< / a > < / li > < / ul >
< / div >
< / div > <!-- top -->
< div class = "header" >
< div class = "summary" >
< a href = "#nested-classes" > Classes< / a > |
< a href = "#typedef-members" > Typedefs< / a > |
< a href = "#func-members" > Functions< / a > < / div >
< div class = "headertitle" > < div class = "title" > steel_gemm_masked.h File Reference< / div > < / div >
< / div > <!-- header -->
< div class = "contents" >
< div class = "textblock" > < code > #include " < a class = "el" href = "steel_2defines_8h_source.html" > mlx/backend/metal/kernels/steel/defines.h< / a > " < / code > < br / >
< / div >
< p > < a href = "steel__gemm__masked_8h_source.html" > Go to the source code of this file.< / a > < / p >
< table class = "memberdecls" >
< tr class = "heading" > < td colspan = "2" > < h2 class = "groupheader" > < a id = "nested-classes" name = "nested-classes" > < / a >
Classes< / h2 > < / td > < / tr >
< tr class = "memitem:" > < td class = "memItemLeft" align = "right" valign = "top" > struct   < / td > < td class = "memItemRight" valign = "bottom" > < a class = "el" href = "struct___no_mask.html" > _NoMask< / a > < / td > < / tr >
< tr class = "separator:" > < td class = "memSeparator" colspan = "2" >   < / td > < / tr >
< tr class = "memitem:" > < td class = "memItemLeft" align = "right" valign = "top" > struct &#160;< / td > < td class = "memItemRight" valign = "bottom" > < a class = "el" href = "struct_scale_op.html" > ScaleOp&lt; OutT, InT &gt;< / a > < / td > < / tr >
< tr class = "separator:" > < td class = "memSeparator" colspan = "2" >   < / td > < / tr >
< / table > < table class = "memberdecls" >
< tr class = "heading" > < td colspan = "2" > < h2 class = "groupheader" > < a id = "typedef-members" name = "typedef-members" > < / a >
Typedefs< / h2 > < / td > < / tr >
< tr class = "memitem:a1480c8cdff1cae1462a5a71632969bca" id = "r_a1480c8cdff1cae1462a5a71632969bca" > < td class = "memItemLeft" align = "right" valign = "top" > typedef struct < a class = "el" href = "struct___no_mask.html" > _NoMask< / a >   < / td > < td class = "memItemRight" valign = "bottom" > < a class = "el" href = "#a1480c8cdff1cae1462a5a71632969bca" > nomask_t< / a > < / td > < / tr >
< tr class = "separator:a1480c8cdff1cae1462a5a71632969bca" > < td class = "memSeparator" colspan = "2" >   < / td > < / tr >
< / table > < table class = "memberdecls" >
< tr class = "heading" > < td colspan = "2" > < h2 class = "groupheader" > < a id = "func-members" name = "func-members" > < / a >
Functions< / h2 > < / td > < / tr >
< tr class = "memitem:af805e998b2046ee30c2b4be813e3af97" id = "r_af805e998b2046ee30c2b4be813e3af97" > < td class = "memTemplParams" colspan = "2" > template&lt;typename T , typename out_mask_t , typename op_mask_t , int BM, int BN, int BK, int WM, int WN, bool transpose_a, bool transpose_b, bool MN_aligned, bool K_aligned&gt; < / td > < / tr >
< tr class = "memitem:af805e998b2046ee30c2b4be813e3af97" > < td class = "memTemplItemLeft" align = "right" valign = "top" > void  < / td > < td class = "memTemplItemRight" valign = "bottom" > < a class = "el" href = "#af805e998b2046ee30c2b4be813e3af97" > block_masked_gemm< / a > (const device T *A, const device T *B, device T *D, const constant < a class = "el" href = "structmlx_1_1steel_1_1_g_e_m_m_params.html" > GEMMParams< / a > *params, const constant int *batch_shape, const constant size_t *batch_strides, const device out_mask_t *out_mask, const device op_mask_t *lhs_mask, const device op_mask_t *rhs_mask, const constant int *mask_strides, uint simd_lane_id, uint simd_group_id, uint3 tid, uint3 lid)< / td > < / tr >
< tr class = "separator:af805e998b2046ee30c2b4be813e3af97" > < td class = "memSeparator" colspan = "2" >   < / td > < / tr >
< tr class = "memitem:a477932e2ae9d49366f7ede6db63f9cac" id = "r_a477932e2ae9d49366f7ede6db63f9cac" > < td class = "memTemplParams" colspan = "2" > template&lt;typename T , int BM, int BN, int BK, int WM, int WN, bool transpose_a, bool transpose_b, bool MN_aligned, bool K_aligned, bool has_operand_mask = false&gt; < / td > < / tr >
< tr class = "memitem:a477932e2ae9d49366f7ede6db63f9cac" > < td class = "memTemplItemLeft" align = "right" valign = "top" > void  < / td > < td class = "memTemplItemRight" valign = "bottom" > < a class = "el" href = "#a477932e2ae9d49366f7ede6db63f9cac" > block_masked_gemm< / a > (const device T *A, const device T *B, device T *D, const constant < a class = "el" href = "structmlx_1_1steel_1_1_g_e_m_m_params.html" > GEMMParams< / a > *params, const constant int *batch_shape, const constant size_t *batch_strides, const device bool *out_mask, const device bool *lhs_mask, const device bool *rhs_mask, const constant int *mask_strides, uint simd_lane_id, uint simd_group_id, uint3 tid, uint3 lid)< / td > < / tr >
< tr class = "separator:a477932e2ae9d49366f7ede6db63f9cac" > < td class = "memSeparator" colspan = "2" >   < / td > < / tr >
< / table >
< h2 class = "groupheader" > Typedef Documentation< / h2 >
< a id = "a1480c8cdff1cae1462a5a71632969bca" name = "a1480c8cdff1cae1462a5a71632969bca" > < / a >
< h2 class = "memtitle" > < span class = "permalink" > < a href = "#a1480c8cdff1cae1462a5a71632969bca" > ◆   < / a > < / span > nomask_t< / h2 >
< div class = "memitem" >
< div class = "memproto" >
< table class = "memname" >
< tr >
<!-- 2024-08-11 00:24:35 +08:00 -->
< td class = "memname" > typedef struct < a class = "el" href = "struct___no_mask.html" > _NoMask< / a > < a class = "el" href = "kernels_2gemv__masked_8h.html#a1480c8cdff1cae1462a5a71632969bca" > nomask_t< / a > < / td >
<!-- 2024-06-07 11:28:06 +08:00 -->
< / tr >
< / table >
< / div > < div class = "memdoc" >
< / div >
< / div >
< h2 class = "groupheader" > Function Documentation< / h2 >
< a id = "a477932e2ae9d49366f7ede6db63f9cac" name = "a477932e2ae9d49366f7ede6db63f9cac" > < / a >
< h2 class = "memtitle" > < span class = "permalink" > < a href = "#a477932e2ae9d49366f7ede6db63f9cac" > ◆   < / a > < / span > block_masked_gemm() < span class = "overload" > [1/2]< / span > < / h2 >
< div class = "memitem" >
< div class = "memproto" >
< div class = "memtemplate" >
template&lt;typename T , int BM, int BN, int BK, int WM, int WN, bool transpose_a, bool transpose_b, bool MN_aligned, bool K_aligned, bool has_operand_mask = false&gt; < / div >
< table class = "memname" >
< tr >
< td class = "memname" > void block_masked_gemm < / td >
< td > (< / td >
< td class = "paramtype" > const device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > A< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > B< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > D< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant < a class = "el" href = "structmlx_1_1steel_1_1_g_e_m_m_params.html" > GEMMParams< / a > *< / td > < td class = "paramname" > < span class = "paramname" > < em > params< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant int *< / td > < td class = "paramname" > < span class = "paramname" > < em > batch_shape< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant size_t *< / td > < td class = "paramname" > < span class = "paramname" > < em > batch_strides< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device bool *< / td > < td class = "paramname" > < span class = "paramname" > < em > out_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device bool *< / td > < td class = "paramname" > < span class = "paramname" > < em > lhs_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device bool *< / td > < td class = "paramname" > < span class = "paramname" > < em > rhs_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant int *< / td > < td class = "paramname" > < span class = "paramname" > < em > mask_strides< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint< / td > < td class = "paramname" > < span class = "paramname" > < em > simd_lane_id< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint< / td > < td class = "paramname" > < span class = "paramname" > < em > simd_group_id< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint3< / td > < td class = "paramname" > < span class = "paramname" > < em > tid< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint3< / td > < td class = "paramname" > < span class = "paramname" > < em > lid< / em > < / span >   )< / td >
< / tr >
< / table >
< / div > < div class = "memdoc" >
< / div >
< / div >
< a id = "af805e998b2046ee30c2b4be813e3af97" name = "af805e998b2046ee30c2b4be813e3af97" > < / a >
< h2 class = "memtitle" > < span class = "permalink" > < a href = "#af805e998b2046ee30c2b4be813e3af97" > ◆   < / a > < / span > block_masked_gemm() < span class = "overload" > [2/2]< / span > < / h2 >
< div class = "memitem" >
< div class = "memproto" >
< div class = "memtemplate" >
template&lt;typename T , typename out_mask_t , typename op_mask_t , int BM, int BN, int BK, int WM, int WN, bool transpose_a, bool transpose_b, bool MN_aligned, bool K_aligned&gt; < / div >
< table class = "memname" >
< tr >
< td class = "memname" > void block_masked_gemm < / td >
< td > (< / td >
< td class = "paramtype" > const device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > A< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > B< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > device T *< / td > < td class = "paramname" > < span class = "paramname" > < em > D< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant < a class = "el" href = "structmlx_1_1steel_1_1_g_e_m_m_params.html" > GEMMParams< / a > *< / td > < td class = "paramname" > < span class = "paramname" > < em > params< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant int *< / td > < td class = "paramname" > < span class = "paramname" > < em > batch_shape< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant size_t *< / td > < td class = "paramname" > < span class = "paramname" > < em > batch_strides< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device out_mask_t *< / td > < td class = "paramname" > < span class = "paramname" > < em > out_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device op_mask_t *< / td > < td class = "paramname" > < span class = "paramname" > < em > lhs_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const device op_mask_t *< / td > < td class = "paramname" > < span class = "paramname" > < em > rhs_mask< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > const constant int *< / td > < td class = "paramname" > < span class = "paramname" > < em > mask_strides< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint< / td > < td class = "paramname" > < span class = "paramname" > < em > simd_lane_id< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint< / td > < td class = "paramname" > < span class = "paramname" > < em > simd_group_id< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint3< / td > < td class = "paramname" > < span class = "paramname" > < em > tid< / em > , < / span > < / td >
< / tr >
< tr >
< td class = "paramkey" > < / td >
< td > < / td >
< td class = "paramtype" > uint3< / td > < td class = "paramname" > < span class = "paramname" > < em > lid< / em > < / span >   )< / td >
< / tr >
< / table >
< / div > < div class = "memdoc" >
< / div >
< / div >
< / div > <!-- contents -->
<!-- start footer part -->
< hr class = "footer" / > < address class = "footer" > < small >
Generated by  < a href = "https://www.doxygen.org/index.html" > < img class = "footer" src = "doxygen.svg" width = "104" height = "31" alt = "doxygen" / > < / a > 1.10.0
< / small > < / address >
< / body >
< / html >