<!-- 2024-10-15 23:12:17 +08:00 -->
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "https://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en-US">
<head>
<!-- Document metadata: encoding, IE compatibility mode, generator tag and viewport. -->
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=11"/>
<meta name="generator" content="Doxygen 1.12.0"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<title>MLX: mlx/backend/metal/kernels/utils.h Source File</title>
<!-- Stylesheets and scripts are loaded in this order; the inline scripts in the body call into them. -->
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<script type="text/javascript" src="clipboard.js"></script>
<link href="navtree.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="resize.js"></script>
<script type="text/javascript" src="cookie.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css"/>
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<!-- Title area: project name banner. -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr id="projectrow">
  <td id="projectalign">
   <div id="projectname">MLX
   </div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.12.0 -->
<!-- Creates the global searchBox object that the inline handlers on #MSearchSelectWindow call. -->
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
var searchBox = new SearchBox("searchBox", "search/",'.html');
/* @license-end */
</script>
<!-- Initialises code folding once the DOM is ready. -->
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
$(function() { codefold.init(0); });
/* @license-end */
</script>
<script type="text/javascript" src="menudata.js"></script>
<script type="text/javascript" src="menu.js"></script>
<!-- Builds the menu, then initialises search, once the DOM is ready. -->
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
$(function() {
  initMenu('',true,false,'search.php','Search',false);
  $(function() { init_search(); });
});
/* @license-end */
</script>
<div id="main-nav"></div>
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
$(function(){ initResizable(false); });
/* @license-end */
</script>
<!-- window showing the filter options -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>
<!-- iframe showing the search results (closed by default) -->
<div id="MSearchResultsWindow">
<div id="MSearchResults">
<div class="SRPage">
<div id="SRIndex">
<div id="SRResults"></div>
<div class="SRStatus" id="Loading">Loading...</div>
<div class="SRStatus" id="Searching">Searching...</div>
<div class="SRStatus" id="NoMatches">No Matches</div>
</div>
</div>
</div>
</div>
<!-- Breadcrumb trail: mlx / backend / metal / kernels. -->
<div id="nav-path" class="navpath">
  <ul>
    <li class="navelem"><a class="el" href="dir_938ab0ecf10b8b860ff766c820f665fd.html">mlx</a></li>
    <li class="navelem"><a class="el" href="dir_1d446c9bd3c99228254c9484e0bc5c06.html">backend</a></li>
    <li class="navelem"><a class="el" href="dir_d0c977ea65824390717cdb7efc36c157.html">metal</a></li>
    <li class="navelem"><a class="el" href="dir_70a37effa88bcbd6b791977fa1e64356.html">kernels</a></li>
  </ul>
</div>
</div><!-- top -->
<div id="doc-content">
<!-- Page heading: name of the file whose source is listed below. -->
<div class="header">
  <div class="headertitle"><div class="title">utils.h</div></div>
</div><!--header-->
<div class="contents">
<!-- Listing of utils.h, source lines 1 to 11: copyright, include guard, includes and the float16_t typedef. -->
<a href="backend_2metal_2kernels_2utils_8h.html">Go to the documentation of this file.</a><div class="fragment"><div class="line"><a id="l00001" name="l00001"></a><span class="lineno">    1</span><span class="comment">// Copyright © 2023-2024 Apple Inc.</span></div>
<div class="line"><a id="l00002" name="l00002"></a><span class="lineno">    2</span> </div>
<div class="line"><a id="l00003" name="l00003"></a><span class="lineno">    3</span><span class="preprocessor">#pragma once</span></div>
<div class="line"><a id="l00004" name="l00004"></a><span class="lineno">    4</span> </div>
<div class="line"><a id="l00005" name="l00005"></a><span class="lineno">    5</span><span class="preprocessor">#include &lt;metal_math&gt;</span></div>
<div class="line"><a id="l00006" name="l00006"></a><span class="lineno">    6</span><span class="preprocessor">#include &quot;<a class="code" href="backend_2metal_2kernels_2bf16_8h.html">mlx/backend/metal/kernels/bf16.h</a>&quot;</span></div>
<div class="line"><a id="l00007" name="l00007"></a><span class="lineno">    7</span><span class="preprocessor">#include &quot;<a class="code" href="backend_2metal_2kernels_2complex_8h.html">mlx/backend/metal/kernels/complex.h</a>&quot;</span></div>
<div class="line"><a id="l00008" name="l00008"></a><span class="lineno">    8</span><span class="preprocessor">#include &quot;<a class="code" href="defines_8h.html">mlx/backend/metal/kernels/defines.h</a>&quot;</span></div>
<div class="line"><a id="l00009" name="l00009"></a><span class="lineno">    9</span> </div>
<div class="line"><a id="l00010" name="l00010"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#acb8ddf4a29129846b673c50ba7078773">   10</a></span><span class="keyword">typedef</span> half <a class="code hl_typedef" href="backend_2metal_2kernels_2utils_8h.html#acb8ddf4a29129846b673c50ba7078773">float16_t</a>;</div>
<div class="line"><a id="l00011" name="l00011"></a><span class="lineno">   11</span> </div>
<!-- Listing of utils.h, source lines 13 to 23: primary Limits template (foldable region). -->
<div class="line"><a id="l00013" name="l00013"></a><span class="lineno">   13</span><span class="comment">// Type limits utils</span></div>
<div class="line"><a id="l00015" name="l00015"></a><span class="lineno">   15</span> </div>
<div class="line"><a id="l00016" name="l00016"></a><span class="lineno">   16</span><span class="keyword">template</span> &lt;<span class="keyword">typename</span> U&gt;</div>
<div class="foldopen" id="foldopen00017" data-start="{" data-end="};">
<div class="line"><a id="l00017" name="l00017"></a><span class="lineno"><a class="line" href="struct_limits.html">   17</a></span><span class="keyword">struct </span><a class="code hl_struct" href="struct_limits.html">Limits</a> {</div>
<div class="line"><a id="l00018" name="l00018"></a><span class="lineno"><a class="line" href="struct_limits.html#a2f0673b6f9da89ce1d64f9f3d74f50a8">   18</a></span>  <span class="keyword">static</span> <span class="keyword">const</span> constant U <a class="code hl_variable" href="struct_limits.html#a2f0673b6f9da89ce1d64f9f3d74f50a8">max</a> = metal::numeric_limits&lt;U&gt;::max();</div>
<div class="line"><a id="l00019" name="l00019"></a><span class="lineno"><a class="line" href="struct_limits.html#a6e81584ba65a4dc6ff9366b458e3a20e">   19</a></span>  <span class="keyword">static</span> <span class="keyword">const</span> constant U <a class="code hl_variable" href="struct_limits.html#a6e81584ba65a4dc6ff9366b458e3a20e">min</a> = metal::numeric_limits&lt;U&gt;::min();</div>
<div class="line"><a id="l00020" name="l00020"></a><span class="lineno"><a class="line" href="struct_limits.html#a5a3eae6d244fbea2aa7b9200001463e5">   20</a></span>  <span class="keyword">static</span> <span class="keyword">const</span> constant U <a class="code hl_variable" href="struct_limits.html#a5a3eae6d244fbea2aa7b9200001463e5">finite_max</a> = metal::numeric_limits&lt;U&gt;::max();</div>
<div class="line"><a id="l00021" name="l00021"></a><span class="lineno"><a class="line" href="struct_limits.html#ae7469d21f2688797ca3e388d919ef05e">   21</a></span>  <span class="keyword">static</span> <span class="keyword">const</span> constant U <a class="code hl_variable" href="struct_limits.html#ae7469d21f2688797ca3e388d919ef05e">finite_min</a> = metal::numeric_limits&lt;U&gt;::min();</div>
<div class="line"><a id="l00022" name="l00022"></a><span class="lineno">   22</span>};</div>
</div>
<div class="line"><a id="l00023" name="l00023"></a><span class="lineno">   23</span> </div>
<!-- Listing of utils.h, source lines 24 to 34: instantiate_default_limit macro (foldable region). -->
<div class="foldopen" id="foldopen00024" data-start="" data-end="">
<div class="line"><a id="l00024" name="l00024"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">   24</a></span><span class="preprocessor">#define instantiate_default_limit(type) \</span></div>
<div class="line"><a id="l00025" name="l00025"></a><span class="lineno">   25</span><span class="preprocessor">  template &lt;&gt; \</span></div>
<div class="line"><a id="l00026" name="l00026"></a><span class="lineno">   26</span><span class="preprocessor">  struct Limits&lt;type&gt; { \</span></div>
<div class="line"><a id="l00027" name="l00027"></a><span class="lineno">   27</span><span class="preprocessor">    static constexpr constant type max = metal::numeric_limits&lt;type&gt;::max(); \</span></div>
<div class="line"><a id="l00028" name="l00028"></a><span class="lineno">   28</span><span class="preprocessor">    static constexpr constant type min = metal::numeric_limits&lt;type&gt;::min(); \</span></div>
<div class="line"><a id="l00029" name="l00029"></a><span class="lineno">   29</span><span class="preprocessor">    static constexpr constant type finite_max = \</span></div>
<div class="line"><a id="l00030" name="l00030"></a><span class="lineno">   30</span><span class="preprocessor">        metal::numeric_limits&lt;type&gt;::max(); \</span></div>
<div class="line"><a id="l00031" name="l00031"></a><span class="lineno">   31</span><span class="preprocessor">    static constexpr constant type finite_min = \</span></div>
<div class="line"><a id="l00032" name="l00032"></a><span class="lineno">   32</span><span class="preprocessor">        metal::numeric_limits&lt;type&gt;::min(); \</span></div>
<div class="line"><a id="l00033" name="l00033"></a><span class="lineno">   33</span><span class="preprocessor">  };</span></div>
</div>
<div class="line"><a id="l00034" name="l00034"></a><span class="lineno">   34</span> </div>
<!-- Listing of utils.h, source lines 35 to 43: instantiate_default_limit applied to the 8/16/32/64-bit unsigned and signed integer types. -->
<div class="line"><a id="l00035" name="l00035"></a><span class="lineno"><a class="line" href="struct_limits_3_01uint8__t_01_4.html#a55f48b89033e8c8683f8540ec6b23f02">   35</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(uint8_t);</div>
<div class="line"><a id="l00036" name="l00036"></a><span class="lineno"><a class="line" href="struct_limits_3_01uint16__t_01_4.html#a9d517d8265ea1898b6b16e91b8595146">   36</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(uint16_t);</div>
<div class="line"><a id="l00037" name="l00037"></a><span class="lineno"><a class="line" href="struct_limits_3_01uint32__t_01_4.html#a0698139f3fe440d7aa08ac5029d72235">   37</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(uint32_t);</div>
<div class="line"><a id="l00038" name="l00038"></a><span class="lineno"><a class="line" href="struct_limits_3_01uint64__t_01_4.html#aff101ff38be5ccdbb9790aecb3069071">   38</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(uint64_t);</div>
<div class="line"><a id="l00039" name="l00039"></a><span class="lineno"><a class="line" href="struct_limits_3_01int8__t_01_4.html#a24cdab873e0fb778393c69f1dc9ecf73">   39</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(int8_t);</div>
<div class="line"><a id="l00040" name="l00040"></a><span class="lineno"><a class="line" href="struct_limits_3_01int16__t_01_4.html#acb2936d1cdbf347a9a014c8e036a5782">   40</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(int16_t);</div>
<div class="line"><a id="l00041" name="l00041"></a><span class="lineno"><a class="line" href="struct_limits_3_01int32__t_01_4.html#aa9ed9f0e8c7400d8fc92e1cba9588794">   41</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(int32_t);</div>
<div class="line"><a id="l00042" name="l00042"></a><span class="lineno"><a class="line" href="struct_limits_3_01int64__t_01_4.html#a6c7254b641878fa0fb9538814c45457a">   42</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c">instantiate_default_limit</a>(int64_t);</div>
<div class="line"><a id="l00043" name="l00043"></a><span class="lineno">   43</span> </div>
<!-- Listing of utils.h, source lines 44 to 56: instantiate_float_limit macro (foldable region). -->
<div class="foldopen" id="foldopen00044" data-start="" data-end="">
<div class="line"><a id="l00044" name="l00044"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#a1e520e23f58ca645dea1ac20998d987a">   44</a></span><span class="preprocessor">#define instantiate_float_limit(type) \</span></div>
<div class="line"><a id="l00045" name="l00045"></a><span class="lineno">   45</span><span class="preprocessor">  template &lt;&gt; \</span></div>
<div class="line"><a id="l00046" name="l00046"></a><span class="lineno">   46</span><span class="preprocessor">  struct Limits&lt;type&gt; { \</span></div>
<div class="line"><a id="l00047" name="l00047"></a><span class="lineno">   47</span><span class="preprocessor">    static constexpr constant type max = \</span></div>
<div class="line"><a id="l00048" name="l00048"></a><span class="lineno">   48</span><span class="preprocessor">        metal::numeric_limits&lt;type&gt;::infinity(); \</span></div>
<div class="line"><a id="l00049" name="l00049"></a><span class="lineno">   49</span><span class="preprocessor">    static constexpr constant type min = \</span></div>
<div class="line"><a id="l00050" name="l00050"></a><span class="lineno">   50</span><span class="preprocessor">        -metal::numeric_limits&lt;type&gt;::infinity(); \</span></div>
<div class="line"><a id="l00051" name="l00051"></a><span class="lineno">   51</span><span class="preprocessor">    static constexpr constant type finite_max = \</span></div>
<div class="line"><a id="l00052" name="l00052"></a><span class="lineno">   52</span><span class="preprocessor">        metal::numeric_limits&lt;type&gt;::max(); \</span></div>
<div class="line"><a id="l00053" name="l00053"></a><span class="lineno">   53</span><span class="preprocessor">    static constexpr constant type finite_min = \</span></div>
<div class="line"><a id="l00054" name="l00054"></a><span class="lineno">   54</span><span class="preprocessor">        -metal::numeric_limits&lt;type&gt;::max(); \</span></div>
<div class="line"><a id="l00055" name="l00055"></a><span class="lineno">   55</span><span class="preprocessor">  };</span></div>
</div>
<div class="line"><a id="l00056" name="l00056"></a><span class="lineno">   56</span> </div>
<!-- Listing of utils.h, source lines 57 to 60: instantiate_float_limit applied to half, float and bfloat16_t. -->
<div class="line"><a id="l00057" name="l00057"></a><span class="lineno"><a class="line" href="struct_limits_3_01half_01_4.html#aedaf0190aabf23da20510e558e2690b4">   57</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#a1e520e23f58ca645dea1ac20998d987a">instantiate_float_limit</a>(half);</div>
<div class="line"><a id="l00058" name="l00058"></a><span class="lineno"><a class="line" href="struct_limits_3_01float_01_4.html#a291eea590113fc1858b7f83f2e0c977d">   58</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#a1e520e23f58ca645dea1ac20998d987a">instantiate_float_limit</a>(<span class="keywordtype">float</span>);</div>
<div class="line"><a id="l00059" name="l00059"></a><span class="lineno"><a class="line" href="struct_limits_3_01bfloat16__t_01_4.html#a6337dc35207b3f6f7185cd73eabac211">   59</a></span><a class="code hl_define" href="backend_2metal_2kernels_2utils_8h.html#a1e520e23f58ca645dea1ac20998d987a">instantiate_float_limit</a>(<a class="code hl_struct" href="struct___m_l_x___b_float16.html">bfloat16_t</a>);</div>
<div class="line"><a id="l00060" name="l00060"></a><span class="lineno">   60</span> </div>
<!-- Listing of utils.h, source lines 61 to 66: Limits specialization for bool (foldable region). -->
<div class="line"><a id="l00061" name="l00061"></a><span class="lineno">   61</span><span class="keyword">template</span> &lt;&gt;</div>
<div class="foldopen" id="foldopen00062" data-start="{" data-end="};">
<div class="line"><a id="l00062" name="l00062"></a><span class="lineno"><a class="line" href="struct_limits_3_01bool_01_4.html">   62</a></span><span class="keyword">struct </span><a class="code hl_struct" href="struct_limits.html">Limits</a>&lt;bool&gt; {</div>
<div class="line"><a id="l00063" name="l00063"></a><span class="lineno"><a class="line" href="struct_limits_3_01bool_01_4.html#acbd2132145888d51220558a101ffcff4">   63</a></span>  <span class="keyword">static</span> <span class="keyword">constexpr</span> constant <span class="keywordtype">bool</span> <a class="code hl_variable" href="struct_limits.html#a2f0673b6f9da89ce1d64f9f3d74f50a8">max</a> = <span class="keyword">true</span>;</div>
<div class="line"><a id="l00064" name="l00064"></a><span class="lineno"><a class="line" href="struct_limits_3_01bool_01_4.html#a139f787b57536d455490b8ef801d37cc">   64</a></span>  <span class="keyword">static</span> <span class="keyword">constexpr</span> constant <span class="keywordtype">bool</span> <a class="code hl_variable" href="struct_limits.html#a6e81584ba65a4dc6ff9366b458e3a20e">min</a> = <span class="keyword">false</span>;</div>
<div class="line"><a id="l00065" name="l00065"></a><span class="lineno">   65</span>};</div>
</div>
<div class="line"><a id="l00066" name="l00066"></a><span class="lineno">   66</span> </div>
<!-- Listing of utils.h, source lines 67 to 76: Limits specialization for complex64_t (foldable region). -->
<div class="line"><a id="l00067" name="l00067"></a><span class="lineno">   67</span><span class="keyword">template</span> &lt;&gt;</div>
<div class="foldopen" id="foldopen00068" data-start="{" data-end="};">
<div class="line"><a id="l00068" name="l00068"></a><span class="lineno"><a class="line" href="struct_limits_3_01complex64__t_01_4.html">   68</a></span><span class="keyword">struct </span><a class="code hl_struct" href="struct_limits.html">Limits</a>&lt;<a class="code hl_struct" href="structcomplex64__t.html">complex64_t</a>&gt; {</div>
<div class="line"><a id="l00069" name="l00069"></a><span class="lineno"><a class="line" href="struct_limits_3_01complex64__t_01_4.html#ac01c274b224b90f5210b675a484f4607">   69</a></span>  <span class="keyword">static</span> <span class="keyword">constexpr</span> constant <a class="code hl_struct" href="structcomplex64__t.html">complex64_t</a> <a class="code hl_variable" href="struct_limits.html#a2f0673b6f9da89ce1d64f9f3d74f50a8">max</a> = <a class="code hl_struct" href="structcomplex64__t.html">complex64_t</a>(</div>
<div class="line"><a id="l00070" name="l00070"></a><span class="lineno">   70</span>      metal::numeric_limits&lt;float&gt;::infinity(),</div>
<div class="line"><a id="l00071" name="l00071"></a><span class="lineno">   71</span>      metal::numeric_limits&lt;float&gt;::infinity());</div>
<div class="line"><a id="l00072" name="l00072"></a><span class="lineno"><a class="line" href="struct_limits_3_01complex64__t_01_4.html#aa67b04aa7abcd67f7af0808737ab8e14">   72</a></span>  <span class="keyword">static</span> <span class="keyword">constexpr</span> constant <a class="code hl_struct" href="structcomplex64__t.html">complex64_t</a> <a class="code hl_variable" href="struct_limits.html#a6e81584ba65a4dc6ff9366b458e3a20e">min</a> = <a class="code hl_struct" href="structcomplex64__t.html">complex64_t</a>(</div>
<div class="line"><a id="l00073" name="l00073"></a><span class="lineno">   73</span>      -metal::numeric_limits&lt;float&gt;::infinity(),</div>
<div class="line"><a id="l00074" name="l00074"></a><span class="lineno">   74</span>      -metal::numeric_limits&lt;float&gt;::infinity());</div>
<div class="line"><a id="l00075" name="l00075"></a><span class="lineno">   75</span>};</div>
</div>
<div class="line"><a id="l00076" name="l00076"></a><span class="lineno">   76</span> </div>
<!-- Listing of utils.h, source lines 78 to 85: indexing section header and the MLX_MTL_PRAGMA_UNROLL macro. -->
<div class="line"><a id="l00078" name="l00078"></a><span class="lineno">   78</span><span class="comment">// Indexing utils</span></div>
<div class="line"><a id="l00080" name="l00080"></a><span class="lineno">   80</span> </div>
<div class="line"><a id="l00081" name="l00081"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#a069b682d7d21827461544817d722bfd3">   81</a></span><span class="preprocessor">#define MLX_MTL_PRAGMA_UNROLL _Pragma(&quot;clang loop unroll(full)&quot;)</span></div>
<div class="line"><a id="l00082" name="l00082"></a><span class="lineno">   82</span> </div>
<div class="line"><a id="l00084" name="l00084"></a><span class="lineno">   84</span><span class="comment">// Single Array with generic dims</span></div>
<div class="line"><a id="l00085" name="l00085"></a><span class="lineno">   85</span> </div>
<!-- Listing of utils.h, source lines 86 to 99: elem_to_loc overload taking a uint element index (foldable region). -->
<div class="line"><a id="l00086" name="l00086"></a><span class="lineno">   86</span><span class="keyword">template</span> &lt;<span class="keyword">typename</span> stride_t&gt;</div>
<div class="foldopen" id="foldopen00087" data-start="{" data-end="}">
<div class="line"><a id="l00087" name="l00087"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1">   87</a></span>METAL_FUNC stride_t <a class="code hl_function" href="backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1">elem_to_loc</a>(</div>
<div class="line"><a id="l00088" name="l00088"></a><span class="lineno">   88</span>    uint elem,</div>
<div class="line"><a id="l00089" name="l00089"></a><span class="lineno">   89</span>    constant <span class="keyword">const</span> <span class="keywordtype">int</span>* shape,</div>
<div class="line"><a id="l00090" name="l00090"></a><span class="lineno">   90</span>    constant <span class="keyword">const</span> stride_t* strides,</div>
<div class="line"><a id="l00091" name="l00091"></a><span class="lineno">   91</span>    <span class="keywordtype">int</span> ndim) {</div>
<div class="line"><a id="l00092" name="l00092"></a><span class="lineno">   92</span>  stride_t loc = 0;</div>
<div class="line"><a id="l00093" name="l00093"></a><span class="lineno">   93</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = ndim - 1; i &gt;= 0 &amp;&amp; elem &gt; 0; --i) {</div>
<div class="line"><a id="l00094" name="l00094"></a><span class="lineno">   94</span>    loc += (elem % shape[i]) * strides[i];</div>
<div class="line"><a id="l00095" name="l00095"></a><span class="lineno">   95</span>    elem /= shape[i];</div>
<div class="line"><a id="l00096" name="l00096"></a><span class="lineno">   96</span>  }</div>
<div class="line"><a id="l00097" name="l00097"></a><span class="lineno">   97</span>  <span class="keywordflow">return</span> loc;</div>
<div class="line"><a id="l00098" name="l00098"></a><span class="lineno">   98</span>}</div>
</div>
<div class="line"><a id="l00099" name="l00099"></a><span class="lineno">   99</span> </div>
<!-- Listing of utils.h, source lines 100 to 113: elem_to_loc overload taking a stride_t element index (foldable region). -->
<div class="line"><a id="l00100" name="l00100"></a><span class="lineno">  100</span><span class="keyword">template</span> &lt;<span class="keyword">typename</span> stride_t&gt;</div>
<div class="foldopen" id="foldopen00101" data-start="{" data-end="}">
<div class="line"><a id="l00101" name="l00101"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#aa6b041005351293e68e19b5abf1286cd">  101</a></span>METAL_FUNC stride_t <a class="code hl_function" href="backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1">elem_to_loc</a>(</div>
<div class="line"><a id="l00102" name="l00102"></a><span class="lineno">  102</span>    stride_t elem,</div>
<div class="line"><a id="l00103" name="l00103"></a><span class="lineno">  103</span>    constant <span class="keyword">const</span> <span class="keywordtype">int</span>* shape,</div>
<div class="line"><a id="l00104" name="l00104"></a><span class="lineno">  104</span>    constant <span class="keyword">const</span> stride_t* strides,</div>
<div class="line"><a id="l00105" name="l00105"></a><span class="lineno">  105</span>    <span class="keywordtype">int</span> ndim) {</div>
<div class="line"><a id="l00106" name="l00106"></a><span class="lineno">  106</span>  stride_t loc = 0;</div>
<div class="line"><a id="l00107" name="l00107"></a><span class="lineno">  107</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = ndim - 1; i &gt;= 0 &amp;&amp; elem &gt; 0; --i) {</div>
<div class="line"><a id="l00108" name="l00108"></a><span class="lineno">  108</span>    loc += (elem % shape[i]) * strides[i];</div>
<div class="line"><a id="l00109" name="l00109"></a><span class="lineno">  109</span>    elem /= shape[i];</div>
<div class="line"><a id="l00110" name="l00110"></a><span class="lineno">  110</span>  }</div>
<div class="line"><a id="l00111" name="l00111"></a><span class="lineno">  111</span>  <span class="keywordflow">return</span> loc;</div>
<div class="line"><a id="l00112" name="l00112"></a><span class="lineno">  112</span>}</div>
</div>
<div class="line"><a id="l00113" name="l00113"></a><span class="lineno">  113</span> </div>
<!-- Listing of utils.h, source lines 114 to 128: elem_to_loc overload taking a uint3 element index (foldable region). -->
<div class="line"><a id="l00114" name="l00114"></a><span class="lineno">  114</span><span class="comment">// Non templated version to handle arbitrary dims</span></div>
<div class="line"><a id="l00115" name="l00115"></a><span class="lineno">  115</span><span class="keyword">template</span> &lt;<span class="keyword">typename</span> stride_t&gt;</div>
<div class="foldopen" id="foldopen00116" data-start="{" data-end="}">
<div class="line"><a id="l00116" name="l00116"></a><span class="lineno"><a class="line" href="backend_2metal_2kernels_2utils_8h.html#a37e00d94751710e81c9632bca2f91e51">  116</a></span>METAL_FUNC stride_t <a class="code hl_function" href="backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1">elem_to_loc</a>(</div>
<div class="line"><a id="l00117" name="l00117"></a><span class="lineno">  117</span>    uint3 elem,</div>
<div class="line"><a id="l00118" name="l00118"></a><span class="lineno">  118</span>    constant <span class="keyword">const</span> <span class="keywordtype">int</span>* shape,</div>
<div class="line"><a id="l00119" name="l00119"></a><span class="lineno">  119</span>    constant <span class="keyword">const</span> stride_t* strides,</div>
<div class="line"><a id="l00120" name="l00120"></a><span class="lineno">  120</span>    <span class="keywordtype">int</span> ndim) {</div>
<div class="line"><a id="l00121" name="l00121"></a><span class="lineno">  121</span>  stride_t loc = elem.x * strides[ndim - 1] + elem.y * strides[ndim - 2];</div>
<div class="line"><a id="l00122" name="l00122"></a><span class="lineno">  122</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> d = ndim - 3; d &gt;= 0; --d) {</div>
<div class="line"><a id="l00123" name="l00123"></a><span class="lineno">  123</span>    loc += (elem.z % shape[d]) * strides[d];</div>
<div class="line"><a id="l00124" name="l00124"></a><span class="lineno">  124</span>    elem.z /= shape[d];</div>
<div class="line"><a id="l00125" name="l00125"></a><span class="lineno">  125</span>  }</div>
<div class="line"><a id="l00126" name="l00126"></a><span class="lineno">  126</span>  <span class="keywordflow">return</span> loc;</div>
<div class="line"><a id="l00127" name="l00127"></a><span class="lineno">  127</span>}</div>
</div>
<div class="line"><a id="l00128" name="l00128"></a><span class="lineno">  128</span> </div>
< div class = "line" > < a id = "l00130" name = "l00130" > < / a > < span class = "lineno" > 130< / span > < span class = "comment" > // Single Array with fixed N dims< / span > < / div >
< div class = "line" > < a id = "l00131" name = "l00131" > < / a > < span class = "lineno" > 131< / span > < / div >
< div class = "line" > < a id = "l00132" name = "l00132" > < / a > < span class = "lineno" > 132< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > stride_t> < / div >
< div class = "foldopen" id = "foldopen00133" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00133" name = "l00133" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a196a07022b812b241d4c06192c0fa83d" > 133< / a > < / span > METAL_FUNC stride_t < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a196a07022b812b241d4c06192c0fa83d" > elem_to_loc_1< / a > (uint elem, constant < span class = "keyword" > const< / span > stride_t& stride) {< / div >
< div class = "line" > < a id = "l00134" name = "l00134" > < / a > < span class = "lineno" > 134< / span > < span class = "keywordflow" > return< / span > elem * stride;< / div >
< div class = "line" > < a id = "l00135" name = "l00135" > < / a > < span class = "lineno" > 135< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00136" name = "l00136" > < / a > < span class = "lineno" > 136< / span > < / div >
< div class = "line" > < a id = "l00137" name = "l00137" > < / a > < span class = "lineno" > 137< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > stride_t> < / div >
< div class = "line" > < a id = "l00138" name = "l00138" > < / a > < span class = "lineno" > 138< / span > METAL_FUNC stride_t< / div >
< div class = "foldopen" id = "foldopen00139" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00139" name = "l00139" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ad6c45cacca97899cd362df49c06fea79" > 139< / a > < / span > < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#ad6c45cacca97899cd362df49c06fea79" > elem_to_loc_2< / a > (uint2 elem, constant < span class = "keyword" > const< / span > stride_t strides[2]) {< / div >
< div class = "line" > < a id = "l00140" name = "l00140" > < / a > < span class = "lineno" > 140< / span > < span class = "keywordflow" > return< / span > elem.x * strides[1] + elem.y * strides[0];< / div >
< div class = "line" > < a id = "l00141" name = "l00141" > < / a > < span class = "lineno" > 141< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00142" name = "l00142" > < / a > < span class = "lineno" > 142< / span > < / div >
< div class = "line" > < a id = "l00143" name = "l00143" > < / a > < span class = "lineno" > 143< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > stride_t> < / div >
< div class = "line" > < a id = "l00144" name = "l00144" > < / a > < span class = "lineno" > 144< / span > METAL_FUNC stride_t< / div >
< div class = "foldopen" id = "foldopen00145" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00145" name = "l00145" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a2c34ed54714c69e6e1b44344f9e6e330" > 145< / a > < / span > < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a2c34ed54714c69e6e1b44344f9e6e330" > elem_to_loc_3< / a > (uint3 elem, constant < span class = "keyword" > const< / span > stride_t strides[3]) {< / div >
< div class = "line" > < a id = "l00146" name = "l00146" > < / a > < span class = "lineno" > 146< / span > < span class = "keywordflow" > return< / span > elem.x * strides[2] + elem.y * strides[1] + elem.z * strides[0];< / div >
< div class = "line" > < a id = "l00147" name = "l00147" > < / a > < span class = "lineno" > 147< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00148" name = "l00148" > < / a > < span class = "lineno" > 148< / span > < / div >
< div class = "line" > < a id = "l00150" name = "l00150" > < / a > < span class = "lineno" > 150< / span > < span class = "comment" > // Multiple Arrays with generic dims< / span > < / div >
< div class = "line" > < a id = "l00151" name = "l00151" > < / a > < span class = "lineno" > 151< / span > < / div >
< div class = "line" > < a id = "l00152" name = "l00152" > < / a > < span class = "lineno" > 152< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > stride_t> < / div >
< div class = "foldopen" id = "foldopen00153" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00153" name = "l00153" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a01c9309978a6c12f79b6e4108728a953" > 153< / a > < / span > METAL_FUNC ulong2 < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a01c9309978a6c12f79b6e4108728a953" > elem_to_loc_2_nd< / a > (< / div >
< div class = "line" > < a id = "l00154" name = "l00154" > < / a > < span class = "lineno" > 154< / span > uint3 elem,< / div >
< div class = "line" > < a id = "l00155" name = "l00155" > < / a > < span class = "lineno" > 155< / span > constant < span class = "keyword" > const< / span > < span class = "keywordtype" > int< / span > * shape,< / div >
< div class = "line" > < a id = "l00156" name = "l00156" > < / a > < span class = "lineno" > 156< / span > constant < span class = "keyword" > const< / span > stride_t* a_strides,< / div >
< div class = "line" > < a id = "l00157" name = "l00157" > < / a > < span class = "lineno" > 157< / span > constant < span class = "keyword" > const< / span > stride_t* b_strides,< / div >
< div class = "line" > < a id = "l00158" name = "l00158" > < / a > < span class = "lineno" > 158< / span > < span class = "keywordtype" > int< / span > ndim) {< / div >
< div class = "line" > < a id = "l00159" name = "l00159" > < / a > < span class = "lineno" > 159< / span > ulong2 loc = {< / div >
< div class = "line" > < a id = "l00160" name = "l00160" > < / a > < span class = "lineno" > 160< / span > ulong(elem.x * a_strides[ndim - 1] + elem.y * a_strides[ndim - 2]),< / div >
< div class = "line" > < a id = "l00161" name = "l00161" > < / a > < span class = "lineno" > 161< / span > ulong(elem.x * b_strides[ndim - 1] + elem.y * b_strides[ndim - 2])};< / div >
< div class = "line" > < a id = "l00162" name = "l00162" > < / a > < span class = "lineno" > 162< / span > < span class = "keywordflow" > for< / span > (< span class = "keywordtype" > int< / span > d = ndim - 3; d >= 0; --d) {< / div >
< div class = "line" > < a id = "l00163" name = "l00163" > < / a > < span class = "lineno" > 163< / span > uint l = elem.z % shape[d];< / div >
< div class = "line" > < a id = "l00164" name = "l00164" > < / a > < span class = "lineno" > 164< / span > loc.x += l * a_strides[d];< / div >
< div class = "line" > < a id = "l00165" name = "l00165" > < / a > < span class = "lineno" > 165< / span > loc.y += l * b_strides[d];< / div >
< div class = "line" > < a id = "l00166" name = "l00166" > < / a > < span class = "lineno" > 166< / span > elem.z /= shape[d];< / div >
< div class = "line" > < a id = "l00167" name = "l00167" > < / a > < span class = "lineno" > 167< / span > }< / div >
< div class = "line" > < a id = "l00168" name = "l00168" > < / a > < span class = "lineno" > 168< / span > < span class = "keywordflow" > return< / span > loc;< / div >
< div class = "line" > < a id = "l00169" name = "l00169" > < / a > < span class = "lineno" > 169< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00170" name = "l00170" > < / a > < span class = "lineno" > 170< / span > < / div >
< div class = "foldopen" id = "foldopen00171" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00171" name = "l00171" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a66940b1cc3d64651d24634bc696d528b" > 171< / a > < / span > METAL_FUNC ulong3 < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a66940b1cc3d64651d24634bc696d528b" > elem_to_loc_3_nd< / a > (< / div >
< div class = "line" > < a id = "l00172" name = "l00172" > < / a > < span class = "lineno" > 172< / span > uint3 elem,< / div >
< div class = "line" > < a id = "l00173" name = "l00173" > < / a > < span class = "lineno" > 173< / span > constant < span class = "keyword" > const< / span > < span class = "keywordtype" > int< / span > * shape,< / div >
< div class = "line" > < a id = "l00174" name = "l00174" > < / a > < span class = "lineno" > 174< / span > constant < span class = "keyword" > const< / span > < span class = "keywordtype" > size_t< / span > * a_strides,< / div >
< div class = "line" > < a id = "l00175" name = "l00175" > < / a > < span class = "lineno" > 175< / span > constant < span class = "keyword" > const< / span > < span class = "keywordtype" > size_t< / span > * b_strides,< / div >
< div class = "line" > < a id = "l00176" name = "l00176" > < / a > < span class = "lineno" > 176< / span > constant < span class = "keyword" > const< / span > < span class = "keywordtype" > size_t< / span > * c_strides,< / div >
< div class = "line" > < a id = "l00177" name = "l00177" > < / a > < span class = "lineno" > 177< / span > < span class = "keywordtype" > int< / span > ndim) {< / div >
< div class = "line" > < a id = "l00178" name = "l00178" > < / a > < span class = "lineno" > 178< / span > ulong3 loc = {< / div >
< div class = "line" > < a id = "l00179" name = "l00179" > < / a > < span class = "lineno" > 179< / span > elem.x * a_strides[ndim - 1] + elem.y * a_strides[ndim - 2],< / div >
< div class = "line" > < a id = "l00180" name = "l00180" > < / a > < span class = "lineno" > 180< / span > elem.x * b_strides[ndim - 1] + elem.y * b_strides[ndim - 2],< / div >
< div class = "line" > < a id = "l00181" name = "l00181" > < / a > < span class = "lineno" > 181< / span > elem.x * c_strides[ndim - 1] + elem.y * c_strides[ndim - 2]};< / div >
< div class = "line" > < a id = "l00182" name = "l00182" > < / a > < span class = "lineno" > 182< / span > < span class = "keywordflow" > for< / span > (< span class = "keywordtype" > int< / span > d = ndim - 3; d >= 0; --d) {< / div >
< div class = "line" > < a id = "l00183" name = "l00183" > < / a > < span class = "lineno" > 183< / span > uint l = elem.z % shape[d];< / div >
< div class = "line" > < a id = "l00184" name = "l00184" > < / a > < span class = "lineno" > 184< / span > loc.x += l * a_strides[d];< / div >
< div class = "line" > < a id = "l00185" name = "l00185" > < / a > < span class = "lineno" > 185< / span > loc.y += l * b_strides[d];< / div >
< div class = "line" > < a id = "l00186" name = "l00186" > < / a > < span class = "lineno" > 186< / span > loc.z += l * c_strides[d];< / div >
< div class = "line" > < a id = "l00187" name = "l00187" > < / a > < span class = "lineno" > 187< / span > elem.z /= shape[d];< / div >
< div class = "line" > < a id = "l00188" name = "l00188" > < / a > < span class = "lineno" > 188< / span > }< / div >
< div class = "line" > < a id = "l00189" name = "l00189" > < / a > < span class = "lineno" > 189< / span > < span class = "keywordflow" > return< / span > loc;< / div >
< div class = "line" > < a id = "l00190" name = "l00190" > < / a > < span class = "lineno" > 190< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00191" name = "l00191" > < / a > < span class = "lineno" > 191< / span > < / div >
< div class = "line" > < a id = "l00193" name = "l00193" > < / a > < span class = "lineno" > 193< / span > < span class = "comment" > // Elem to loc in a loop utils< / span > < / div >
< div class = "line" > < a id = "l00195" name = "l00195" > < / a > < span class = "lineno" > 195< / span > < / div >
< div class = "line" > < a id = "l00196" name = "l00196" > < / a > < span class = "lineno" > 196< / span > < span class = "keyword" > template< / span > < < span class = "keywordtype" > int< / span > dim, < span class = "keyword" > typename< / span > offset_t = < span class = "keywordtype" > size_t< / span > > < / div >
< div class = "foldopen" id = "foldopen00197" data-start = "{" data-end = "};" >
< div class = "line" > < a id = "l00197" name = "l00197" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html" > 197< / a > < / span > < span class = "keyword" > struct < / span > < a class = "code hl_struct" href = "structlooped__elem__to__loc.html" > looped_elem_to_loc< / a > {< / div >
< div class = "line" > < a id = "l00198" name = "l00198" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > 198< / a > < / span > < a class = "code hl_struct" href = "structlooped__elem__to__loc.html" > looped_elem_to_loc< / a > < dim - 1, offset_t> < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > inner_looper< / a > ;< / div >
< div class = "line" > < a id = "l00199" name = "l00199" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > 199< / a > < / span > offset_t < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > {0};< / div >
< div class = "line" > < a id = "l00200" name = "l00200" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > 200< / a > < / span > < span class = "keywordtype" > int< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > {0};< / div >
< div class = "line" > < a id = "l00201" name = "l00201" > < / a > < span class = "lineno" > 201< / span > < / div >
< div class = "foldopen" id = "foldopen00202" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00202" name = "l00202" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#a05558dabba889ee0d80ed4b567d901ca" > 202< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc.html#a05558dabba889ee0d80ed4b567d901ca" > next< / a > (< span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > * shape, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > * strides) {< / div >
< div class = "line" > < a id = "l00203" name = "l00203" > < / a > < span class = "lineno" > 203< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > ++;< / div >
< div class = "line" > < a id = "l00204" name = "l00204" > < / a > < span class = "lineno" > 204< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > += strides[dim - 1];< / div >
< div class = "line" > < a id = "l00205" name = "l00205" > < / a > < span class = "lineno" > 205< / span > < / div >
< div class = "line" > < a id = "l00206" name = "l00206" > < / a > < span class = "lineno" > 206< / span > < span class = "keywordflow" > if< / span > (< a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > >= shape[dim - 1]) {< / div >
< div class = "line" > < a id = "l00207" name = "l00207" > < / a > < span class = "lineno" > 207< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > = 0;< / div >
< div class = "line" > < a id = "l00208" name = "l00208" > < / a > < span class = "lineno" > 208< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > inner_looper< / a > .next(shape, strides);< / div >
< div class = "line" > < a id = "l00209" name = "l00209" > < / a > < span class = "lineno" > 209< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > = < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > inner_looper< / a > .offset;< / div >
< div class = "line" > < a id = "l00210" name = "l00210" > < / a > < span class = "lineno" > 210< / span > }< / div >
< div class = "line" > < a id = "l00211" name = "l00211" > < / a > < span class = "lineno" > 211< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00212" name = "l00212" > < / a > < span class = "lineno" > 212< / span > < / div >
< div class = "foldopen" id = "foldopen00213" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00213" name = "l00213" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#add610f331ef8d7d2d1917050890f82b2" > 213< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc.html#add610f331ef8d7d2d1917050890f82b2" > next< / a > (< span class = "keywordtype" > int< / span > n, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > * shape, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > * strides) {< / div >
< div class = "line" > < a id = "l00214" name = "l00214" > < / a > < span class = "lineno" > 214< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > += n;< / div >
< div class = "line" > < a id = "l00215" name = "l00215" > < / a > < span class = "lineno" > 215< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > += n * strides[dim - 1];< / div >
< div class = "line" > < a id = "l00216" name = "l00216" > < / a > < span class = "lineno" > 216< / span > < / div >
< div class = "line" > < a id = "l00217" name = "l00217" > < / a > < span class = "lineno" > 217< / span > < span class = "keywordflow" > if< / span > (< a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > >= shape[dim - 1]) {< / div >
< div class = "line" > < a id = "l00218" name = "l00218" > < / a > < span class = "lineno" > 218< / span > < span class = "keywordtype" > int< / span > extra = < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > - shape[dim - 1];< / div >
< div class = "line" > < a id = "l00219" name = "l00219" > < / a > < span class = "lineno" > 219< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > index< / a > = 0;< / div >
< div class = "line" > < a id = "l00220" name = "l00220" > < / a > < span class = "lineno" > 220< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > inner_looper< / a > .next(shape, strides);< / div >
< div class = "line" > < a id = "l00221" name = "l00221" > < / a > < span class = "lineno" > 221< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > = < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > inner_looper< / a > .offset;< / div >
< div class = "line" > < a id = "l00222" name = "l00222" > < / a > < span class = "lineno" > 222< / span > < span class = "keywordflow" > if< / span > (extra > 0) {< / div >
< div class = "line" > < a id = "l00223" name = "l00223" > < / a > < span class = "lineno" > 223< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc.html#add610f331ef8d7d2d1917050890f82b2" > next< / a > (extra, shape, strides);< / div >
< div class = "line" > < a id = "l00224" name = "l00224" > < / a > < span class = "lineno" > 224< / span > }< / div >
< div class = "line" > < a id = "l00225" name = "l00225" > < / a > < span class = "lineno" > 225< / span > }< / div >
< div class = "line" > < a id = "l00226" name = "l00226" > < / a > < span class = "lineno" > 226< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00227" name = "l00227" > < / a > < span class = "lineno" > 227< / span > < / div >
< div class = "line" > < a id = "l00228" name = "l00228" > < / a > < span class = "lineno" > 228< / span > offset_t< / div >
< div class = "foldopen" id = "foldopen00229" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00229" name = "l00229" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc.html#accc6d4957a8aeb38f5062754793b74d2" > 229< / a > < / span > < a class = "code hl_function" href = "structlooped__elem__to__loc.html#accc6d4957a8aeb38f5062754793b74d2" > location< / a > (offset_t, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > *, < span class = "keywordtype" > int< / span > ) {< / div >
< div class = "line" > < a id = "l00230" name = "l00230" > < / a > < span class = "lineno" > 230< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > ;< / div >
< div class = "line" > < a id = "l00231" name = "l00231" > < / a > < span class = "lineno" > 231< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00232" name = "l00232" > < / a > < span class = "lineno" > 232< / span > };< / div >
< / div >
< div class = "line" > < a id = "l00233" name = "l00233" > < / a > < span class = "lineno" > 233< / span > < / div >
< div class = "line" > < a id = "l00234" name = "l00234" > < / a > < span class = "lineno" > 234< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > offset_t> < / div >
< div class = "foldopen" id = "foldopen00235" data-start = "{" data-end = "};" >
< div class = "line" > < a id = "l00235" name = "l00235" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html" > 235< / a > < / span > < span class = "keyword" > struct < / span > < a class = "code hl_struct" href = "structlooped__elem__to__loc.html" > looped_elem_to_loc< / a > < 1, offset_t> {< / div >
< div class = "line" > < a id = "l00236" name = "l00236" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a7aebc0b0656e3a55d0dbca27a57d600e" > 236< / a > < / span > offset_t < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > {0};< / div >
< div class = "line" > < a id = "l00237" name = "l00237" > < / a > < span class = "lineno" > 237< / span > < / div >
< div class = "foldopen" id = "foldopen00238" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00238" name = "l00238" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a96cf2987c04210c9197e5237e425c4b4" > 238< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a96cf2987c04210c9197e5237e425c4b4" > next< / a > (< span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > * strides) {< / div >
< div class = "line" > < a id = "l00239" name = "l00239" > < / a > < span class = "lineno" > 239< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > += strides[0];< / div >
< div class = "line" > < a id = "l00240" name = "l00240" > < / a > < span class = "lineno" > 240< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00241" name = "l00241" > < / a > < span class = "lineno" > 241< / span > < / div >
< div class = "foldopen" id = "foldopen00242" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00242" name = "l00242" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#af2984b35f7d7300d4812e7872b3c8851" > 242< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#af2984b35f7d7300d4812e7872b3c8851" > next< / a > (< span class = "keywordtype" > int< / span > n, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > * strides) {< / div >
< div class = "line" > < a id = "l00243" name = "l00243" > < / a > < span class = "lineno" > 243< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > += n * strides[0];< / div >
< div class = "line" > < a id = "l00244" name = "l00244" > < / a > < span class = "lineno" > 244< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00245" name = "l00245" > < / a > < span class = "lineno" > 245< / span > < / div >
< div class = "line" > < a id = "l00246" name = "l00246" > < / a > < span class = "lineno" > 246< / span > offset_t< / div >
< div class = "foldopen" id = "foldopen00247" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00247" name = "l00247" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a368d2a2204cee5055386954acd5ccb90" > 247< / a > < / span > < a class = "code hl_function" href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a368d2a2204cee5055386954acd5ccb90" > location< / a > (offset_t, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > *, < span class = "keywordtype" > int< / span > ) {< / div >
< div class = "line" > < a id = "l00248" name = "l00248" > < / a > < span class = "lineno" > 248< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_variable" href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > offset< / a > ;< / div >
< div class = "line" > < a id = "l00249" name = "l00249" > < / a > < span class = "lineno" > 249< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00250" name = "l00250" > < / a > < span class = "lineno" > 250< / span > };< / div >
< / div >
< div class = "line" > < a id = "l00251" name = "l00251" > < / a > < span class = "lineno" > 251< / span > < / div >
< div class = "line" > < a id = "l00252" name = "l00252" > < / a > < span class = "lineno" > 252< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > offset_t> < / div >
< div class = "foldopen" id = "foldopen00253" data-start = "{" data-end = "};" >
< div class = "line" > < a id = "l00253" name = "l00253" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html" > 253< / a > < / span > < span class = "keyword" > struct < / span > < a class = "code hl_struct" href = "structlooped__elem__to__loc.html" > looped_elem_to_loc< / a > < 0, offset_t> {< / div >
< div class = "line" > < a id = "l00254" name = "l00254" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#aa1e9e1009c16befb9a730835836436e0" > 254< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#aa1e9e1009c16befb9a730835836436e0" > next< / a > (< span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > *) {}< / div >
< div class = "line" > < a id = "l00255" name = "l00255" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a1064cdfdcef779b5628ce5357a6fe4f0" > 255< / a > < / span > < span class = "keywordtype" > void< / span > < a class = "code hl_function" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a1064cdfdcef779b5628ce5357a6fe4f0" > next< / a > (< span class = "keywordtype" > int< / span > , < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > *, < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > *) {}< / div >
< div class = "line" > < a id = "l00256" name = "l00256" > < / a > < span class = "lineno" > 256< / span > < / div >
< div class = "foldopen" id = "foldopen00257" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00257" name = "l00257" > < / a > < span class = "lineno" > < a class = "line" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a8c7aaffda0ca500d9f9566e5e74217a2" > 257< / a > < / span > offset_t < a class = "code hl_function" href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a8c7aaffda0ca500d9f9566e5e74217a2" > location< / a > (< / div >
< div class = "line" > < a id = "l00258" name = "l00258" > < / a > < span class = "lineno" > 258< / span > offset_t idx,< / div >
< div class = "line" > < a id = "l00259" name = "l00259" > < / a > < span class = "lineno" > 259< / span > < span class = "keyword" > const< / span > constant < span class = "keywordtype" > int< / span > * shape,< / div >
< div class = "line" > < a id = "l00260" name = "l00260" > < / a > < span class = "lineno" > 260< / span > < span class = "keyword" > const< / span > constant < span class = "keywordtype" > size_t< / span > * strides,< / div >
< div class = "line" > < a id = "l00261" name = "l00261" > < / a > < span class = "lineno" > 261< / span > < span class = "keywordtype" > int< / span > ndim) {< / div >
< div class = "line" > < a id = "l00262" name = "l00262" > < / a > < span class = "lineno" > 262< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1" > elem_to_loc< / a > (idx, shape, strides, ndim);< / div >
< div class = "line" > < a id = "l00263" name = "l00263" > < / a > < span class = "lineno" > 263< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00264" name = "l00264" > < / a > < span class = "lineno" > 264< / span > };< / div >
< / div >
< div class = "line" > < a id = "l00265" name = "l00265" > < / a > < span class = "lineno" > 265< / span > < / div >
< div class = "line" > < a id = "l00267" name = "l00267" > < / a > < span class = "lineno" > 267< / span > < span class = "comment" > // Calculation utils< / span > < / div >
< div class = "line" > < a id = "l00269" name = "l00269" > < / a > < span class = "lineno" > 269< / span > < / div >
< div class = "line" > < a id = "l00271" name = "l00271" > < / a > < span class = "lineno" > 271< / span > < span class = "keyword" > template< / span > < < span class = "keyword" > typename< / span > T, < span class = "keyword" > typename< / span > U> < / div >
< div class = "foldopen" id = "foldopen00272" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00272" name = "l00272" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a8e5a4b0fb5d018d7b078d147efe4f1e3" > 272< / a > < / span > < span class = "keyword" > inline< / span > T < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a8e5a4b0fb5d018d7b078d147efe4f1e3" > ceildiv< / a > (T N, U M) {< / div >
< div class = "line" > < a id = "l00273" name = "l00273" > < / a > < span class = "lineno" > 273< / span > < span class = "keywordflow" > return< / span > (N + M - 1) / M;< / div >
< div class = "line" > < a id = "l00274" name = "l00274" > < / a > < span class = "lineno" > 274< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00275" name = "l00275" > < / a > < span class = "lineno" > 275< / span > < / div >
< div class = "line" > < a id = "l00276" name = "l00276" > < / a > < span class = "lineno" > 276< / span > < span class = "comment" > // https://docs.oracle.com/cd/E19957-01/806-3568/ncg_goldberg.html#1202< / span > < / div >
< div class = "foldopen" id = "foldopen00277" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00277" name = "l00277" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a27c03f2f90ab56db2e4d59559a3d2e9a" > 277< / a > < / span > < span class = "keyword" > inline< / span > < span class = "keywordtype" > float< / span > < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a27c03f2f90ab56db2e4d59559a3d2e9a" > log1p< / a > (< span class = "keywordtype" > float< / span > x) {< / div >
< div class = "line" > < a id = "l00278" name = "l00278" > < / a > < span class = "lineno" > 278< / span > < span class = "keywordtype" > float< / span > xp1 = 1.0f + x;< / div >
< div class = "line" > < a id = "l00279" name = "l00279" > < / a > < span class = "lineno" > 279< / span > < span class = "keywordflow" > if< / span > (xp1 == < a class = "code hl_struct" href = "struct_limits.html" > Limits< float> ::max< / a > ) {< / div >
< div class = "line" > < a id = "l00280" name = "l00280" > < / a > < span class = "lineno" > 280< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "struct_limits.html" > Limits< float> ::max< / a > ;< / div >
< div class = "line" > < a id = "l00281" name = "l00281" > < / a > < span class = "lineno" > 281< / span > }< / div >
< div class = "line" > < a id = "l00282" name = "l00282" > < / a > < span class = "lineno" > 282< / span > < span class = "keywordflow" > if< / span > (xp1 == 1.0f) {< / div >
< div class = "line" > < a id = "l00283" name = "l00283" > < / a > < span class = "lineno" > 283< / span > < span class = "keywordflow" > return< / span > x;< / div >
< div class = "line" > < a id = "l00284" name = "l00284" > < / a > < span class = "lineno" > 284< / span > }< / div >
< div class = "line" > < a id = "l00285" name = "l00285" > < / a > < span class = "lineno" > 285< / span > < / div >
< div class = "line" > < a id = "l00286" name = "l00286" > < / a > < span class = "lineno" > 286< / span > < span class = "keywordflow" > return< / span > x * (< a class = "code hl_function" href = "namespacemetal.html#a423a9f4f2fc7ef5ec7eda061277b51b6" > metal::log< / a > (xp1) / (xp1 - 1.0f));< / div >
< div class = "line" > < a id = "l00287" name = "l00287" > < / a > < span class = "lineno" > 287< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00288" name = "l00288" > < / a > < span class = "lineno" > 288< / span > < / div >
< div class = "foldopen" id = "foldopen00289" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00289" name = "l00289" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a3501b665c8837eabf9789ea27a7d6946" > 289< / a > < / span > < span class = "keyword" > inline< / span > < a class = "code hl_struct" href = "struct___m_l_x___b_float16.html" > bfloat16_t< / a > < a class = "code hl_function" href = "backend_2metal_2kernels_2utils_8h.html#a27c03f2f90ab56db2e4d59559a3d2e9a" > log1p< / a > (< a class = "code hl_struct" href = "struct___m_l_x___b_float16.html" > bfloat16_t< / a > x) {< / div >
< div class = "line" > < a id = "l00290" name = "l00290" > < / a > < span class = "lineno" > 290< / span > < span class = "keywordtype" > float< / span > xp1 = 1.0f + < span class = "keyword" > static_cast< < / span > < span class = "keywordtype" > float< / span > < span class = "keyword" > > < / span > (x);< / div >
< div class = "line" > < a id = "l00291" name = "l00291" > < / a > < span class = "lineno" > 291< / span > < span class = "keywordflow" > if< / span > (xp1 == < a class = "code hl_struct" href = "struct_limits.html" > Limits< float> ::max< / a > ) {< / div >
< div class = "line" > < a id = "l00292" name = "l00292" > < / a > < span class = "lineno" > 292< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "struct_limits.html" > Limits< bfloat16_t> ::max< / a > ;< / div >
< div class = "line" > < a id = "l00293" name = "l00293" > < / a > < span class = "lineno" > 293< / span > }< / div >
< div class = "line" > < a id = "l00294" name = "l00294" > < / a > < span class = "lineno" > 294< / span > < span class = "keywordflow" > if< / span > (xp1 == 1.0f) {< / div >
< div class = "line" > < a id = "l00295" name = "l00295" > < / a > < span class = "lineno" > 295< / span > < span class = "keywordflow" > return< / span > x;< / div >
< div class = "line" > < a id = "l00296" name = "l00296" > < / a > < span class = "lineno" > 296< / span > }< / div >
< div class = "line" > < a id = "l00297" name = "l00297" > < / a > < span class = "lineno" > 297< / span > < / div >
< div class = "line" > < a id = "l00298" name = "l00298" > < / a > < span class = "lineno" > 298< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_typedef" href = "backend_2metal_2kernels_2bf16_8h.html#a7782de82393104dd4ad754ce3b316e82" > bfloat16_t< / a > (x * (< a class = "code hl_function" href = "namespacemetal.html#a423a9f4f2fc7ef5ec7eda061277b51b6" > metal::log< / a > (xp1) / (xp1 - 1.0f)));< / div >
< div class = "line" > < a id = "l00299" name = "l00299" > < / a > < span class = "lineno" > 299< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00300" name = "l00300" > < / a > < span class = "lineno" > 300< / span > < / div >
< div class = "line" > < a id = "l00302" name = "l00302" > < / a > < span class = "lineno" > 302< / span > < span class = "comment" > // SIMD shuffle ops< / span > < / div >
< div class = "line" > < a id = "l00304" name = "l00304" > < / a > < span class = "lineno" > 304< / span > < / div >
< div class = "foldopen" id = "foldopen00305" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00305" name = "l00305" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#aba6279624b1d30c525efee856a222b5c" > 305< / a > < / span > < span class = "keyword" > inline< / span > uint64_t < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (uint64_t data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00306" name = "l00306" > < / a > < span class = "lineno" > 306< / span > < span class = "keywordflow" > return< / span > as_type< uint64_t> (< / div >
< div class = "line" > < a id = "l00307" name = "l00307" > < / a > < span class = "lineno" > 307< / span > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > metal::simd_shuffle_down< / a > (as_type< uint2> (data), delta));< / div >
< div class = "line" > < a id = "l00308" name = "l00308" > < / a > < span class = "lineno" > 308< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00309" name = "l00309" > < / a > < span class = "lineno" > 309< / span > < / div >
< div class = "foldopen" id = "foldopen00310" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00310" name = "l00310" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a0c1e4d782fcc56e1ab5565cef12430dd" > 310< / a > < / span > < span class = "keyword" > inline< / span > int64_t < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (int64_t data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00311" name = "l00311" > < / a > < span class = "lineno" > 311< / span > < span class = "keywordflow" > return< / span > as_type< int64_t> (< / div >
< div class = "line" > < a id = "l00312" name = "l00312" > < / a > < span class = "lineno" > 312< / span > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > metal::simd_shuffle_down< / a > (as_type< uint2> (data), delta));< / div >
< div class = "line" > < a id = "l00313" name = "l00313" > < / a > < span class = "lineno" > 313< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00314" name = "l00314" > < / a > < span class = "lineno" > 314< / span > < / div >
< div class = "foldopen" id = "foldopen00315" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00315" name = "l00315" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a48ae83a8caf5c74810df60b6c6cdb062" > 315< / a > < / span > < span class = "keyword" > inline< / span > < span class = "keywordtype" > bool< / span > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (< span class = "keywordtype" > bool< / span > data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00316" name = "l00316" > < / a > < span class = "lineno" > 316< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (< span class = "keyword" > static_cast< < / span > uint32_t< span class = "keyword" > > < / span > (data), delta);< / div >
< div class = "line" > < a id = "l00317" name = "l00317" > < / a > < span class = "lineno" > 317< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00318" name = "l00318" > < / a > < span class = "lineno" > 318< / span > < / div >
< div class = "foldopen" id = "foldopen00319" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00319" name = "l00319" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ad9a671a5f9aaa729ae7a77026f16bcb0" > 319< / a > < / span > < span class = "keyword" > inline< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (< a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00320" name = "l00320" > < / a > < span class = "lineno" > 320< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > (< / div >
< div class = "line" > < a id = "l00321" name = "l00321" > < / a > < span class = "lineno" > 321< / span > < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > real< / a > , delta), < a class = "code hl_function" href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > simd_shuffle_down< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > imag< / a > , delta));< / div >
< div class = "line" > < a id = "l00322" name = "l00322" > < / a > < span class = "lineno" > 322< / span > }< / div >
< / div >
2024-10-26 04:23:45 +08:00
< div class = "line" > < a id = "l00323" name = "l00323" > < / a > < span class = "lineno" > 323< / span > < / div >
< div class = "foldopen" id = "foldopen00324" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00324" name = "l00324" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a39e436e0a942912266aae7e0bd82d7c0" > 324< / a > < / span > < span class = "keyword" > inline< / span > uint64_t < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (uint64_t data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00325" name = "l00325" > < / a > < span class = "lineno" > 325< / span > < span class = "keywordflow" > return< / span > as_type< uint64_t> (< a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > metal::simd_shuffle_up< / a > (as_type< uint2> (data), delta));< / div >
< div class = "line" > < a id = "l00326" name = "l00326" > < / a > < span class = "lineno" > 326< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00327" name = "l00327" > < / a > < span class = "lineno" > 327< / span > < / div >
< div class = "foldopen" id = "foldopen00328" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00328" name = "l00328" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a617f3857caf33c569afa6148135f8b7a" > 328< / a > < / span > < span class = "keyword" > inline< / span > int64_t < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (int64_t data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00329" name = "l00329" > < / a > < span class = "lineno" > 329< / span > < span class = "keywordflow" > return< / span > as_type< int64_t> (< a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > metal::simd_shuffle_up< / a > (as_type< uint2> (data), delta));< / div >
< div class = "line" > < a id = "l00330" name = "l00330" > < / a > < span class = "lineno" > 330< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00331" name = "l00331" > < / a > < span class = "lineno" > 331< / span > < / div >
< div class = "foldopen" id = "foldopen00332" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00332" name = "l00332" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ae0f5c42020275a588234e69f1eb7a485" > 332< / a > < / span > < span class = "keyword" > inline< / span > < span class = "keywordtype" > bool< / span > < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (< span class = "keywordtype" > bool< / span > data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00333" name = "l00333" > < / a > < span class = "lineno" > 333< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (< span class = "keyword" > static_cast< < / span > uint32_t< span class = "keyword" > > < / span > (data), delta);< / div >
< div class = "line" > < a id = "l00334" name = "l00334" > < / a > < span class = "lineno" > 334< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00335" name = "l00335" > < / a > < span class = "lineno" > 335< / span > < / div >
< div class = "foldopen" id = "foldopen00336" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00336" name = "l00336" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a92b455bac6a23af51c35ea83de2383eb" > 336< / a > < / span > < span class = "keyword" > inline< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (< a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > data, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00337" name = "l00337" > < / a > < span class = "lineno" > 337< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > (< / div >
< div class = "line" > < a id = "l00338" name = "l00338" > < / a > < span class = "lineno" > 338< / span > < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > real< / a > , delta), < a class = "code hl_function" href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > simd_shuffle_up< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > imag< / a > , delta));< / div >
< div class = "line" > < a id = "l00339" name = "l00339" > < / a > < span class = "lineno" > 339< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00340" name = "l00340" > < / a > < span class = "lineno" > 340< / span > < / div >
< div class = "line" > < a id = "l00341" name = "l00341" > < / a > < span class = "lineno" > 341< / span > < span class = "keyword" > inline< / span > uint64_t< / div >
< div class = "foldopen" id = "foldopen00342" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00342" name = "l00342" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a5862d5ea154c9b76cf56a630cf6385b4" > 342< / a > < / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (uint64_t data, uint64_t filling, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00343" name = "l00343" > < / a > < span class = "lineno" > 343< / span > < span class = "keywordflow" > return< / span > as_type< uint64_t> (< a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > metal::simd_shuffle_and_fill_up< / a > (< / div >
< div class = "line" > < a id = "l00344" name = "l00344" > < / a > < span class = "lineno" > 344< / span > as_type< uint2> (data), as_type< uint2> (filling), delta));< / div >
< div class = "line" > < a id = "l00345" name = "l00345" > < / a > < span class = "lineno" > 345< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00346" name = "l00346" > < / a > < span class = "lineno" > 346< / span > < / div >
< div class = "line" > < a id = "l00347" name = "l00347" > < / a > < span class = "lineno" > 347< / span > < span class = "keyword" > inline< / span > int64_t< / div >
< div class = "foldopen" id = "foldopen00348" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00348" name = "l00348" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a7bb56415c5412a6a26f70a990915f064" > 348< / a > < / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (int64_t data, int64_t filling, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00349" name = "l00349" > < / a > < span class = "lineno" > 349< / span > < span class = "keywordflow" > return< / span > as_type< int64_t> (< a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > metal::simd_shuffle_and_fill_up< / a > (< / div >
< div class = "line" > < a id = "l00350" name = "l00350" > < / a > < span class = "lineno" > 350< / span > as_type< uint2> (data), as_type< uint2> (filling), delta));< / div >
< div class = "line" > < a id = "l00351" name = "l00351" > < / a > < span class = "lineno" > 351< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00352" name = "l00352" > < / a > < span class = "lineno" > 352< / span > < / div >
< div class = "foldopen" id = "foldopen00353" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00353" name = "l00353" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ad55bd473647f2c6c68e65e5312c132d1" > 353< / a > < / span > < span class = "keyword" > inline< / span > < span class = "keywordtype" > bool< / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (< span class = "keywordtype" > bool< / span > data, < span class = "keywordtype" > bool< / span > filling, uint16_t delta) {< / div >
< div class = "line" > < a id = "l00354" name = "l00354" > < / a > < span class = "lineno" > 354< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (< / div >
< div class = "line" > < a id = "l00355" name = "l00355" > < / a > < span class = "lineno" > 355< / span > < span class = "keyword" > static_cast< < / span > uint32_t< span class = "keyword" > > < / span > (data), < span class = "keyword" > static_cast< < / span > uint32_t< span class = "keyword" > > < / span > (filling), delta);< / div >
< div class = "line" > < a id = "l00356" name = "l00356" > < / a > < span class = "lineno" > 356< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00357" name = "l00357" > < / a > < span class = "lineno" > 357< / span > < / div >
< div class = "foldopen" id = "foldopen00358" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00358" name = "l00358" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a94e02a6ae8c39cbf4cb23aa44df9dbd5" > 358< / a > < / span > < span class = "keyword" > inline< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (< / div >
< div class = "line" > < a id = "l00359" name = "l00359" > < / a > < span class = "lineno" > 359< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > data,< / div >
< div class = "line" > < a id = "l00360" name = "l00360" > < / a > < span class = "lineno" > 360< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > filling,< / div >
< div class = "line" > < a id = "l00361" name = "l00361" > < / a > < span class = "lineno" > 361< / span > uint16_t delta) {< / div >
< div class = "line" > < a id = "l00362" name = "l00362" > < / a > < span class = "lineno" > 362< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > (< / div >
< div class = "line" > < a id = "l00363" name = "l00363" > < / a > < span class = "lineno" > 363< / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > real< / a > , filling.< a class = "code hl_variable" href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > real< / a > , delta),< / div >
< div class = "line" > < a id = "l00364" name = "l00364" > < / a > < span class = "lineno" > 364< / span > < a class = "code hl_function" href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > simd_shuffle_and_fill_up< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > imag< / a > , filling.< a class = "code hl_variable" href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > imag< / a > , delta));< / div >
< div class = "line" > < a id = "l00365" name = "l00365" > < / a > < span class = "lineno" > 365< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00366" name = "l00366" > < / a > < span class = "lineno" > 366< / span > < / div >
< div class = "foldopen" id = "foldopen00367" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00367" name = "l00367" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a71986ecdd7d18f975dd22c3df7421ce2" > 367< / a > < / span > < span class = "keyword" > inline< / span > uint64_t < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (uint64_t data, uint16_t lane) {< / div >
< div class = "line" > < a id = "l00368" name = "l00368" > < / a > < span class = "lineno" > 368< / span > < span class = "keywordflow" > return< / span > as_type< uint64_t> (< a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > metal::simd_shuffle< / a > (as_type< uint2> (data), lane));< / div >
< div class = "line" > < a id = "l00369" name = "l00369" > < / a > < span class = "lineno" > 369< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00370" name = "l00370" > < / a > < span class = "lineno" > 370< / span > < / div >
< div class = "foldopen" id = "foldopen00371" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00371" name = "l00371" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#a3bdbdfeb7a1dde40cd3ce1df8d9213b5" > 371< / a > < / span > < span class = "keyword" > inline< / span > int64_t < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (int64_t data, uint16_t lane) {< / div >
< div class = "line" > < a id = "l00372" name = "l00372" > < / a > < span class = "lineno" > 372< / span > < span class = "keywordflow" > return< / span > as_type< int64_t> (< a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > metal::simd_shuffle< / a > (as_type< uint2> (data), lane));< / div >
< div class = "line" > < a id = "l00373" name = "l00373" > < / a > < span class = "lineno" > 373< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00374" name = "l00374" > < / a > < span class = "lineno" > 374< / span > < / div >
< div class = "foldopen" id = "foldopen00375" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00375" name = "l00375" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ab4cbcdb054f9165130da91a3334da0cf" > 375< / a > < / span > < span class = "keyword" > inline< / span > < span class = "keywordtype" > bool< / span > < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (< span class = "keywordtype" > bool< / span > data, uint16_t lane) {< / div >
< div class = "line" > < a id = "l00376" name = "l00376" > < / a > < span class = "lineno" > 376< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (< span class = "keyword" > static_cast< < / span > uint32_t< span class = "keyword" > > < / span > (data), lane);< / div >
< div class = "line" > < a id = "l00377" name = "l00377" > < / a > < span class = "lineno" > 377< / span > }< / div >
< / div >
< div class = "line" > < a id = "l00378" name = "l00378" > < / a > < span class = "lineno" > 378< / span > < / div >
< div class = "foldopen" id = "foldopen00379" data-start = "{" data-end = "}" >
< div class = "line" > < a id = "l00379" name = "l00379" > < / a > < span class = "lineno" > < a class = "line" href = "backend_2metal_2kernels_2utils_8h.html#ab8175b66bcc080fb89f738143568c30b" > 379< / a > < / span > < span class = "keyword" > inline< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (< a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > data, uint16_t lane) {< / div >
< div class = "line" > < a id = "l00380" name = "l00380" > < / a > < span class = "lineno" > 380< / span > < span class = "keywordflow" > return< / span > < a class = "code hl_struct" href = "structcomplex64__t.html" > complex64_t< / a > (< / div >
< div class = "line" > < a id = "l00381" name = "l00381" > < / a > < span class = "lineno" > 381< / span > < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > real< / a > , lane), < a class = "code hl_function" href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > simd_shuffle< / a > (data.< a class = "code hl_variable" href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > imag< / a > , lane));< / div >
< div class = "line" > < a id = "l00382" name = "l00382" > < / a > < span class = "lineno" > 382< / span > }< / div >
< / div >
< div class = "ttc" id = "abackend_2metal_2allocator_8h_html_ae704ab07eac590091daa5fc4aec7bddb" > < div class = "ttname" > < a href = "backend_2metal_2allocator_8h.html#ae704ab07eac590091daa5fc4aec7bddb" > next< / a > < / div > < div class = "ttdeci" > BufferHolder * next< / div > < div class = "ttdef" > < b > Definition< / b > allocator.h:38< / div > < / div >
2024-10-15 23:12:17 +08:00
< div class = "ttc" id = "abackend_2metal_2kernels_2bf16_8h_html" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2bf16_8h.html" > bf16.h< / a > < / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2bf16_8h_html_a7782de82393104dd4ad754ce3b316e82" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2bf16_8h.html#a7782de82393104dd4ad754ce3b316e82" > bfloat16_t< / a > < / div > < div class = "ttdeci" > struct _MLX_BFloat16 bfloat16_t< / div > < div class = "ttdef" > < b > Definition< / b > bf16.h:257< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2complex_8h_html" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2complex_8h.html" > complex.h< / a > < / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a01c9309978a6c12f79b6e4108728a953" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a01c9309978a6c12f79b6e4108728a953" > elem_to_loc_2_nd< / a > < / div > < div class = "ttdeci" > METAL_FUNC ulong2 elem_to_loc_2_nd(uint3 elem, constant const int *shape, constant const stride_t *a_strides, constant const stride_t *b_strides, int ndim)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:153< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a196a07022b812b241d4c06192c0fa83d" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a196a07022b812b241d4c06192c0fa83d" > elem_to_loc_1< / a > < / div > < div class = "ttdeci" > METAL_FUNC stride_t elem_to_loc_1(uint elem, constant const stride_t & stride)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:133< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a1e520e23f58ca645dea1ac20998d987a" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a1e520e23f58ca645dea1ac20998d987a" > instantiate_float_limit< / a > < / div > < div class = "ttdeci" > #define instantiate_float_limit(type)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:44< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a27c03f2f90ab56db2e4d59559a3d2e9a" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a27c03f2f90ab56db2e4d59559a3d2e9a" > log1p< / a > < / div > < div class = "ttdeci" > float log1p(float x)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:277< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a2c34ed54714c69e6e1b44344f9e6e330" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a2c34ed54714c69e6e1b44344f9e6e330" > elem_to_loc_3< / a > < / div > < div class = "ttdeci" > METAL_FUNC stride_t elem_to_loc_3(uint3 elem, constant const stride_t strides[3])< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:145< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a66940b1cc3d64651d24634bc696d528b" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a66940b1cc3d64651d24634bc696d528b" > elem_to_loc_3_nd< / a > < / div > < div class = "ttdeci" > METAL_FUNC ulong3 elem_to_loc_3_nd(uint3 elem, constant const int *shape, constant const size_t *a_strides, constant const size_t *b_strides, constant const size_t *c_strides, int ndim)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:171< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a8e5a4b0fb5d018d7b078d147efe4f1e3" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a8e5a4b0fb5d018d7b078d147efe4f1e3" > ceildiv< / a > < / div > < div class = "ttdeci" > T ceildiv(T N, U M)< / div > < div class = "ttdoc" > Compute ceil((float)N/(float)M)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:272< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_a8fd0c8fc6058e650fc99bca8b6acd7d1" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#a8fd0c8fc6058e650fc99bca8b6acd7d1" > elem_to_loc< / a > < / div > < div class = "ttdeci" > METAL_FUNC stride_t elem_to_loc(uint elem, constant const int *shape, constant const stride_t *strides, int ndim)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:87< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_abedffa358e7ba7782cc78d6772064c7c" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#abedffa358e7ba7782cc78d6772064c7c" > instantiate_default_limit< / a > < / div > < div class = "ttdeci" > #define instantiate_default_limit(type)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:24< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_acb8ddf4a29129846b673c50ba7078773" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#acb8ddf4a29129846b673c50ba7078773" > float16_t< / a > < / div > < div class = "ttdeci" > half float16_t< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:10< / div > < / div >
< div class = "ttc" id = "abackend_2metal_2kernels_2utils_8h_html_ad6c45cacca97899cd362df49c06fea79" > < div class = "ttname" > < a href = "backend_2metal_2kernels_2utils_8h.html#ad6c45cacca97899cd362df49c06fea79" > elem_to_loc_2< / a > < / div > < div class = "ttdeci" > METAL_FUNC stride_t elem_to_loc_2(uint2 elem, constant const stride_t strides[2])< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:139< / div > < / div >
< div class = "ttc" id = "adefines_8h_html" > < div class = "ttname" > < a href = "defines_8h.html" > defines.h< / a > < / div > < / div >
2024-10-26 04:23:45 +08:00
< div class = "ttc" id = "anamespacemetal_html_a1ca14116bf50639b214d8414b5bbaaa6" > < div class = "ttname" > < a href = "namespacemetal.html#a1ca14116bf50639b214d8414b5bbaaa6" > metal::simd_shuffle_and_fill_up< / a > < / div > < div class = "ttdeci" > METAL_FUNC bfloat16_t simd_shuffle_and_fill_up(bfloat16_t data, bfloat16_t filling_data, ushort delta, ushort modulo)< / div > < div class = "ttdef" > < b > Definition< / b > bf16_math.h:391< / div > < / div >
< div class = "ttc" id = "anamespacemetal_html_a259ed115bc3c58f88eb35830916b26d4" > < div class = "ttname" > < a href = "namespacemetal.html#a259ed115bc3c58f88eb35830916b26d4" > metal::simd_shuffle< / a > < / div > < div class = "ttdeci" > METAL_FUNC bfloat16_t simd_shuffle(bfloat16_t data, ushort simd_lane_id)< / div > < div class = "ttdef" > < b > Definition< / b > bf16_math.h:391< / div > < / div >
2024-10-15 23:12:17 +08:00
< div class = "ttc" id = "anamespacemetal_html_a423a9f4f2fc7ef5ec7eda061277b51b6" > < div class = "ttname" > < a href = "namespacemetal.html#a423a9f4f2fc7ef5ec7eda061277b51b6" > metal::log< / a > < / div > < div class = "ttdeci" > METAL_FUNC bfloat16_t log(bfloat16_t x)< / div > < div class = "ttdef" > < b > Definition< / b > bf16_math.h:234< / div > < / div >
< div class = "ttc" id = "anamespacemetal_html_af6e2dd7ae087aba6abac4f0350b7611c" > < div class = "ttname" > < a href = "namespacemetal.html#af6e2dd7ae087aba6abac4f0350b7611c" > metal::simd_shuffle_down< / a > < / div > < div class = "ttdeci" > METAL_FUNC bfloat16_t simd_shuffle_down(bfloat16_t data, ushort delta)< / div > < div class = "ttdef" > < b > Definition< / b > bf16_math.h:391< / div > < / div >
2024-10-26 04:23:45 +08:00
< div class = "ttc" id = "anamespacemetal_html_afe81c5fbde3f4890458b081909242c55" > < div class = "ttname" > < a href = "namespacemetal.html#afe81c5fbde3f4890458b081909242c55" > metal::simd_shuffle_up< / a > < / div > < div class = "ttdeci" > METAL_FUNC bfloat16_t simd_shuffle_up(bfloat16_t data, ushort delta)< / div > < div class = "ttdef" > < b > Definition< / b > bf16_math.h:391< / div > < / div >
2024-10-15 23:12:17 +08:00
< div class = "ttc" id = "anamespacepocketfft_1_1detail_html_afb987c919e9424a996d0fc8b3c23cc84" > < div class = "ttname" > < a href = "namespacepocketfft_1_1detail.html#afb987c919e9424a996d0fc8b3c23cc84" > pocketfft::detail::stride_t< / a > < / div > < div class = "ttdeci" > std::vector< ptrdiff_t > stride_t< / div > < div class = "ttdef" > < b > Definition< / b > pocketfft.h:103< / div > < / div >
< div class = "ttc" id = "astruct___m_l_x___b_float16_html" > < div class = "ttname" > < a href = "struct___m_l_x___b_float16.html" > _MLX_BFloat16< / a > < / div > < div class = "ttdef" > < b > Definition< / b > bf16.h:54< / div > < / div >
< div class = "ttc" id = "astruct_limits_html" > < div class = "ttname" > < a href = "struct_limits.html" > Limits< / a > < / div > < div class = "ttdef" > < b > Definition< / b > utils.h:17< / div > < / div >
< div class = "ttc" id = "astruct_limits_html_a2f0673b6f9da89ce1d64f9f3d74f50a8" > < div class = "ttname" > < a href = "struct_limits.html#a2f0673b6f9da89ce1d64f9f3d74f50a8" > Limits::max< / a > < / div > < div class = "ttdeci" > static const constant U max< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:18< / div > < / div >
< div class = "ttc" id = "astruct_limits_html_a5a3eae6d244fbea2aa7b9200001463e5" > < div class = "ttname" > < a href = "struct_limits.html#a5a3eae6d244fbea2aa7b9200001463e5" > Limits::finite_max< / a > < / div > < div class = "ttdeci" > static const constant U finite_max< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:20< / div > < / div >
< div class = "ttc" id = "astruct_limits_html_a6e81584ba65a4dc6ff9366b458e3a20e" > < div class = "ttname" > < a href = "struct_limits.html#a6e81584ba65a4dc6ff9366b458e3a20e" > Limits::min< / a > < / div > < div class = "ttdeci" > static const constant U min< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:19< / div > < / div >
< div class = "ttc" id = "astruct_limits_html_ae7469d21f2688797ca3e388d919ef05e" > < div class = "ttname" > < a href = "struct_limits.html#ae7469d21f2688797ca3e388d919ef05e" > Limits::finite_min< / a > < / div > < div class = "ttdeci" > static const constant U finite_min< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:21< / div > < / div >
< div class = "ttc" id = "astructcomplex64__t_html" > < div class = "ttname" > < a href = "structcomplex64__t.html" > complex64_t< / a > < / div > < div class = "ttdef" > < b > Definition< / b > complex.h:20< / div > < / div >
< div class = "ttc" id = "astructcomplex64__t_html_a94037c0cf8451aaff7cb4d154a8426de" > < div class = "ttname" > < a href = "structcomplex64__t.html#a94037c0cf8451aaff7cb4d154a8426de" > complex64_t::imag< / a > < / div > < div class = "ttdeci" > float imag< / div > < div class = "ttdef" > < b > Definition< / b > complex.h:22< / div > < / div >
< div class = "ttc" id = "astructcomplex64__t_html_abbd4a0092eca9f112c1c5ae1a133a27e" > < div class = "ttname" > < a href = "structcomplex64__t.html#abbd4a0092eca9f112c1c5ae1a133a27e" > complex64_t::real< / a > < / div > < div class = "ttdeci" > float real< / div > < div class = "ttdef" > < b > Definition< / b > complex.h:21< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_010_00_01offset__t_01_4_html_a1064cdfdcef779b5628ce5357a6fe4f0" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a1064cdfdcef779b5628ce5357a6fe4f0" > looped_elem_to_loc< 0, offset_t > ::next< / a > < / div > < div class = "ttdeci" > void next(int, const constant int *, const constant size_t *)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:255< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_010_00_01offset__t_01_4_html_a8c7aaffda0ca500d9f9566e5e74217a2" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#a8c7aaffda0ca500d9f9566e5e74217a2" > looped_elem_to_loc< 0, offset_t > ::location< / a > < / div > < div class = "ttdeci" > offset_t location(offset_t idx, const constant int *shape, const constant size_t *strides, int ndim)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:257< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_010_00_01offset__t_01_4_html_aa1e9e1009c16befb9a730835836436e0" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_010_00_01offset__t_01_4.html#aa1e9e1009c16befb9a730835836436e0" > looped_elem_to_loc< 0, offset_t > ::next< / a > < / div > < div class = "ttdeci" > void next(const constant int *, const constant size_t *)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:254< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_011_00_01offset__t_01_4_html_a368d2a2204cee5055386954acd5ccb90" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a368d2a2204cee5055386954acd5ccb90" > looped_elem_to_loc< 1, offset_t > ::location< / a > < / div > < div class = "ttdeci" > offset_t location(offset_t, const constant int *, const constant size_t *, int)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:247< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_011_00_01offset__t_01_4_html_a96cf2987c04210c9197e5237e425c4b4" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#a96cf2987c04210c9197e5237e425c4b4" > looped_elem_to_loc< 1, offset_t > ::next< / a > < / div > < div class = "ttdeci" > void next(const constant int *, const constant size_t *strides)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:238< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_3_011_00_01offset__t_01_4_html_af2984b35f7d7300d4812e7872b3c8851" > < div class = "ttname" > < a href = "structlooped__elem__to__loc_3_011_00_01offset__t_01_4.html#af2984b35f7d7300d4812e7872b3c8851" > looped_elem_to_loc< 1, offset_t > ::next< / a > < / div > < div class = "ttdeci" > void next(int n, const constant int *, const constant size_t *strides)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:242< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html" > looped_elem_to_loc< / a > < / div > < div class = "ttdef" > < b > Definition< / b > utils.h:197< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_a05558dabba889ee0d80ed4b567d901ca" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#a05558dabba889ee0d80ed4b567d901ca" > looped_elem_to_loc::next< / a > < / div > < div class = "ttdeci" > void next(const constant int *shape, const constant size_t *strides)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:202< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_a11ef1389c9224e9117fd6374d740e0e0" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#a11ef1389c9224e9117fd6374d740e0e0" > looped_elem_to_loc::offset< / a > < / div > < div class = "ttdeci" > offset_t offset< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:199< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_a29b154409551fea0a4ef50bf320ebc0a" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#a29b154409551fea0a4ef50bf320ebc0a" > looped_elem_to_loc::index< / a > < / div > < div class = "ttdeci" > int index< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:200< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_a42c76764640618d721c48ef6b4f59189" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#a42c76764640618d721c48ef6b4f59189" > looped_elem_to_loc::inner_looper< / a > < / div > < div class = "ttdeci" > looped_elem_to_loc< dim - 1, offset_t > inner_looper< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:198< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_accc6d4957a8aeb38f5062754793b74d2" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#accc6d4957a8aeb38f5062754793b74d2" > looped_elem_to_loc::location< / a > < / div > < div class = "ttdeci" > offset_t location(offset_t, const constant int *, const constant size_t *, int)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:229< / div > < / div >
< div class = "ttc" id = "astructlooped__elem__to__loc_html_add610f331ef8d7d2d1917050890f82b2" > < div class = "ttname" > < a href = "structlooped__elem__to__loc.html#add610f331ef8d7d2d1917050890f82b2" > looped_elem_to_loc::next< / a > < / div > < div class = "ttdeci" > void next(int n, const constant int *shape, const constant size_t *strides)< / div > < div class = "ttdef" > < b > Definition< / b > utils.h:213< / div > < / div >
< / div > <!-- fragment --> < / div > <!-- contents -->
<!-- start footer part -->
< hr class = "footer" / > < address class = "footer" > < small >
Generated by  < a href = "https://www.doxygen.org/index.html" > < img class = "footer" src = "doxygen.svg" width = "104" height = "31" alt = "doxygen" / > < / a > 1.12.0
< / small > < / address >
< / div > <!-- doc - content -->
< / body >
< / html >