2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "https://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< html  xmlns = "http://www.w3.org/1999/xhtml"  lang = "en-US" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< head > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< meta  http-equiv = "Content-Type"  content = "text/xhtml;charset=UTF-8" / > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< meta  http-equiv = "X-UA-Compatible"  content = "IE=11" / > 
							 
						 
					
						
							
								
									
										
										
										
											2025-02-06 20:16:29 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< meta  name = "generator"  content = "Doxygen 1.13.2" / > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< meta  name = "viewport"  content = "width=device-width, initial-scale=1" / > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< title > MLX: mlx/backend/metal/kernels/steel/conv/kernels/steel_conv_general.h Source File< / title > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< link  href = "tabs.css"  rel = "stylesheet"  type = "text/css" / > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "jquery.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "dynsections.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "clipboard.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< link  href = "navtree.css"  rel = "stylesheet"  type = "text/css" / > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "navtreedata.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "navtree.js" > < / script > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "resize.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "cookie.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< link  href = "search/search.css"  rel = "stylesheet"  type = "text/css" / > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "search/searchdata.js" > < / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript"  src = "search/search.js" > < / script > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  $(function() { init_search(); });
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license-end */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / script > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< link  href = "doxygen.css"  rel = "stylesheet"  type = "text/css"  / > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / head > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< body > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "top" > <!--  do not remove this div, it is closed by doxygen!  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "titlearea" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< table  cellspacing = "0"  cellpadding = "0" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								 < tbody > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								 < tr  id = "projectrow" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < td  id = "projectalign" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								   < div  id = "projectname" > MLX
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								   < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < / td > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								    < td >         < div  id = "MSearchBox"  class = "MSearchBoxInactive" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								        < span  class = "left" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								          < span  id = "MSearchSelect"                 onmouseover = "return searchBox.OnSearchSelectShow()"                 onmouseout = "return searchBox.OnSearchSelectHide()" >   < / span > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								          < input  type = "text"  id = "MSearchField"  value = ""  placeholder = "Search"  accesskey = "S" 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								               onfocus="searchBox.OnSearchFieldFocus(true)" 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								               onblur="searchBox.OnSearchFieldFocus(false)" 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								               onkeyup="searchBox.OnSearchFieldChange(event)"/>
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								          < / span > < span  class = "right" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								            < a  id = "MSearchClose"  href = "javascript:searchBox.CloseResultsWindow()" > < img  id = "MSearchCloseImg"  border = "0"  src = "search/close.svg"  alt = "" / > < / a > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								          < / span > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								        < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / td > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								 < / tr > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								 < / tbody > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / table > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<!--  end header part  --> 
							 
						 
					
						
							
								
									
										
										
										
											2025-02-06 20:16:29 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								<!--  Generated by Doxygen 1.13.2  --> 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								var searchBox = new SearchBox("searchBox", "search/",'.html');
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license-end */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / script > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								$(function() { codefold.init(0); });
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license-end */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / script > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< / div > <!--  top  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "side-nav"  class = "ui-resizable side-nav-resizable" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < div  id = "nav-tree" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								    < div  id = "nav-tree-contents" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								      < div  id = "nav-sync"  class = "sync" > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								    < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < div  id = "splitbar"  style = "-moz-user-select:none;"  
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								       class="ui-resizable-handle">
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< script  type = "text/javascript" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								/* @license magnet:?xt=urn:btih:d3d9a9a6595521f9666a5e94cc830dab83b65699&amp;dn=expat.txt MIT */
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								$(function(){initNavTree('steel__conv__general_8h_source.html',''); initResizable(true); });
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								/* @license-end */
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / script > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< div  id = "doc-content" > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								<!--  window showing the filter options  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "MSearchSelectWindow" 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								     onmouseover="return searchBox.OnSearchSelectShow()"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								     onmouseout="return searchBox.OnSearchSelectHide()"
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								     onkeydown="return searchBox.OnSearchSelectKey(event)">
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<!--  iframe showing the search results (closed by default)  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "MSearchResultsWindow" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "MSearchResults" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "SRPage" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "SRIndex" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "SRResults" > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "SRStatus"  id = "Loading" > Loading...< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "SRStatus"  id = "Searching" > Searching...< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "SRStatus"  id = "NoMatches" > No Matches< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "header" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < div  class = "headertitle" > < div  class = "title" > steel_conv_general.h< / div > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > <!-- header --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "contents" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< a  href = "steel__conv__general_8h.html" > Go to the documentation of this file.< / a > < div  class = "fragment" > < div  class = "line" > < a  id = "l00001"  name = "l00001" > < / a > < span  class = "lineno" >     1< / span > < span  class = "comment" > // Copyright © 2024 Apple Inc.< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00002"  name = "l00002" > < / a > < span  class = "lineno" >     2< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<div class="line"><a id="l00003" name="l00003"></a><span class="lineno">    3</span><span class="preprocessor">#include &quot;<a class="code" href="loader__general_8h.html">mlx/backend/metal/kernels/steel/conv/loaders/loader_general.h</a>&quot;</span></div>
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00004"  name = "l00004" > < / a > < span  class = "lineno" >     4< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<div class="line"><a id="l00005" name="l00005"></a><span class="lineno">    5</span><span class="keyword">template</span> &lt;</div>
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00006"  name = "l00006" > < / a > < span  class = "lineno" >     6< / span >     < span  class = "keyword" > typename< / span >  T,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00007"  name = "l00007" > < / a > < span  class = "lineno" >     7< / span >     < span  class = "keywordtype" > int< / span >  BM,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00008"  name = "l00008" > < / a > < span  class = "lineno" >     8< / span >     < span  class = "keywordtype" > int< / span >  BN,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00009"  name = "l00009" > < / a > < span  class = "lineno" >     9< / span >     < span  class = "keywordtype" > int< / span >  BK,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00010"  name = "l00010" > < / a > < span  class = "lineno" >    10< / span >     < span  class = "keywordtype" > int< / span >  WM,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00011"  name = "l00011" > < / a > < span  class = "lineno" >    11< / span >     < span  class = "keywordtype" > int< / span >  WN,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00012"  name = "l00012" > < / a > < span  class = "lineno" >    12< / span >     < span  class = "keyword" > typename< / span >  AccumType = float,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<div class="line"><a id="l00013" name="l00013"></a><span class="lineno">   13</span>    <span class="keyword">typename</span> Epilogue = TransformNone&lt;T, AccumType&gt;&gt;</div>
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00014"  name = "l00014" > < / a > < span  class = "lineno" >    14< / span > [[kernel, max_total_threads_per_threadgroup(WM* WN * 32)]] < span  class = "keywordtype" > void< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "foldopen"  id = "foldopen00015"  data-start = "{"  data-end = "}" > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00015"  name = "l00015" > < / a > < span  class = "lineno" > < a  class = "line"  href = "steel__conv__general_8h.html#ad620c0656ae92e36dcb4a285d9e790ee" >    15< / a > < / span > < a  class = "code hl_function"  href = "steel__conv__general_8h.html#ad620c0656ae92e36dcb4a285d9e790ee" > implicit_gemm_conv_2d_general< / a > (< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00016"  name = "l00016" > < / a > < span  class = "lineno" >    16< / span >     < span  class = "keyword" > const< / span >  device T* A [[buffer(0)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00017"  name = "l00017" > < / a > < span  class = "lineno" >    17< / span >     < span  class = "keyword" > const< / span >  device T* B [[buffer(1)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00018"  name = "l00018" > < / a > < span  class = "lineno" >    18< / span >     device T* C [[buffer(2)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								<div class="line"><a id="l00019" name="l00019"></a><span class="lineno">   19</span>    <span class="keyword">const</span> constant <a class="code hl_struct" href="struct_m_l_x_conv_params.html">MLXConvParams&lt;2&gt;</a>* params [[buffer(3)]],</div>
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00020"  name = "l00020" > < / a > < span  class = "lineno" >    20< / span >     < span  class = "keyword" > const< / span >  constant ImplicitGemmConv2DParams* gemm_params [[buffer(4)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00021"  name = "l00021" > < / a > < span  class = "lineno" >    21< / span >     < span  class = "keyword" > const< / span >  constant Conv2DGeneralJumpParams* jump_params [[buffer(5)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00022"  name = "l00022" > < / a > < span  class = "lineno" >    22< / span >     < span  class = "keyword" > const< / span >  constant Conv2DGeneralBaseInfo* base_h [[buffer(6)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00023"  name = "l00023" > < / a > < span  class = "lineno" >    23< / span >     < span  class = "keyword" > const< / span >  constant Conv2DGeneralBaseInfo* base_w [[buffer(7)]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00024"  name = "l00024" > < / a > < span  class = "lineno" >    24< / span >     uint3 tid [[threadgroup_position_in_grid]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00025"  name = "l00025" > < / a > < span  class = "lineno" >    25< / span >     uint3 lid [[thread_position_in_threadgroup]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00026"  name = "l00026" > < / a > < span  class = "lineno" >    26< / span >     uint simd_gid [[simdgroup_index_in_threadgroup]],< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00027"  name = "l00027" > < / a > < span  class = "lineno" >    27< / span >     uint simd_lid [[thread_index_in_simdgroup]]) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00028"  name = "l00028" > < / a > < span  class = "lineno" >    28< / span >   (void)lid;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00029"  name = "l00029" > < / a > < span  class = "lineno" >    29< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00030"  name = "l00030" > < / a > < span  class = "lineno" >    30< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > bool< / span >  transpose_a = < span  class = "keyword" > false< / span > ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00031"  name = "l00031" > < / a > < span  class = "lineno" >    31< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > bool< / span >  transpose_b = < span  class = "keyword" > true< / span > ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00032"  name = "l00032" > < / a > < span  class = "lineno" >    32< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  tgp_padding_a = 16 / < span  class = "keyword" > sizeof< / span > (T);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00033"  name = "l00033" > < / a > < span  class = "lineno" >    33< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  tgp_padding_b = 16 / < span  class = "keyword" > sizeof< / span > (T);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00034"  name = "l00034" > < / a > < span  class = "lineno" >    34< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00035"  name = "l00035" > < / a > < span  class = "lineno" >    35< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  shape_a_cols = (transpose_a ? BM : BK) + tgp_padding_a;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00036"  name = "l00036" > < / a > < span  class = "lineno" >    36< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  shape_b_cols = (transpose_b ? BK : BN) + tgp_padding_b;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00037"  name = "l00037" > < / a > < span  class = "lineno" >    37< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  shape_a_rows = (transpose_a ? BK : BM);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00038"  name = "l00038" > < / a > < span  class = "lineno" >    38< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  shape_b_rows = (transpose_b ? BN : BK);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00039"  name = "l00039" > < / a > < span  class = "lineno" >    39< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  tgp_mem_size_a = shape_a_cols * shape_a_rows;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00040"  name = "l00040" > < / a > < span  class = "lineno" >    40< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  tgp_mem_size_b = shape_b_cols * shape_b_rows;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00041"  name = "l00041" > < / a > < span  class = "lineno" >    41< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00042"  name = "l00042" > < / a > < span  class = "lineno" >    42< / span >   < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  tgp_size = WM * WN * 32;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00043"  name = "l00043" > < / a > < span  class = "lineno" >    43< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00044"  name = "l00044" > < / a > < span  class = "lineno" >    44< / span >   < span  class = "comment" > // Input loader< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00045"  name = "l00045" > < / a > < span  class = "lineno" >    45< / span >   < span  class = "keyword" > using < / span > loader_a_t =< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00046"  name = "l00046" > < / a > < span  class = "lineno" >    46< / span >       Conv2DInputBlockLoaderGeneral< T, BM, BN, BK, tgp_size, tgp_padding_a> ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00047"  name = "l00047" > < / a > < span  class = "lineno" >    47< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00048"  name = "l00048" > < / a > < span  class = "lineno" >    48< / span >   < span  class = "comment" > // Weight loader< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00049"  name = "l00049" > < / a > < span  class = "lineno" >    49< / span >   < span  class = "keyword" > using < / span > loader_b_t =< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00050"  name = "l00050" > < / a > < span  class = "lineno" >    50< / span >       Conv2DWeightBlockLoaderGeneral< T, BM, BN, BK, tgp_size, tgp_padding_b> ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00051"  name = "l00051" > < / a > < span  class = "lineno" >    51< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00052"  name = "l00052" > < / a > < span  class = "lineno" >    52< / span >   < span  class = "keyword" > using < / span > mma_t = BlockMMA< < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00053"  name = "l00053" > < / a > < span  class = "lineno" >    53< / span >       T,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00054"  name = "l00054" > < / a > < span  class = "lineno" >    54< / span >       T,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00055"  name = "l00055" > < / a > < span  class = "lineno" >    55< / span >       BM,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00056"  name = "l00056" > < / a > < span  class = "lineno" >    56< / span >       BN,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00057"  name = "l00057" > < / a > < span  class = "lineno" >    57< / span >       BK,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00058"  name = "l00058" > < / a > < span  class = "lineno" >    58< / span >       WM,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00059"  name = "l00059" > < / a > < span  class = "lineno" >    59< / span >       WN,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00060"  name = "l00060" > < / a > < span  class = "lineno" >    60< / span >       transpose_a,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00061"  name = "l00061" > < / a > < span  class = "lineno" >    61< / span >       transpose_b,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00062"  name = "l00062" > < / a > < span  class = "lineno" >    62< / span >       shape_a_cols,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00063"  name = "l00063" > < / a > < span  class = "lineno" >    63< / span >       shape_b_cols> ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00064"  name = "l00064" > < / a > < span  class = "lineno" >    64< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00065"  name = "l00065" > < / a > < span  class = "lineno" >    65< / span >   threadgroup T As[tgp_mem_size_a];< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00066"  name = "l00066" > < / a > < span  class = "lineno" >    66< / span >   threadgroup T Bs[tgp_mem_size_b];< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00067"  name = "l00067" > < / a > < span  class = "lineno" >    67< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00068"  name = "l00068" > < / a > < span  class = "lineno" >    68< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  tid_y = ((tid.y) < <  gemm_params-> swizzle_log) +< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00069"  name = "l00069" > < / a > < span  class = "lineno" >    69< / span >       ((tid.x) &  ((1 < <  gemm_params-> swizzle_log) - 1));< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00070"  name = "l00070" > < / a > < span  class = "lineno" >    70< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  tid_x = (tid.x) > >  gemm_params-> swizzle_log;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00071"  name = "l00071" > < / a > < span  class = "lineno" >    71< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00072"  name = "l00072" > < / a > < span  class = "lineno" >    72< / span >   < span  class = "keywordflow" > if< / span >  (gemm_params-> tiles_n < = tid_x || gemm_params-> tiles_m < = tid_y) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00073"  name = "l00073" > < / a > < span  class = "lineno" >    73< / span >     < span  class = "keywordflow" > return< / span > ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00074"  name = "l00074" > < / a > < span  class = "lineno" >    74< / span >   }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00075"  name = "l00075" > < / a > < span  class = "lineno" >    75< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00076"  name = "l00076" > < / a > < span  class = "lineno" >    76< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  tid_z = tid.z;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00077"  name = "l00077" > < / a > < span  class = "lineno" >    77< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00078"  name = "l00078" > < / a > < span  class = "lineno" >    78< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_oh = tid_z / jump_params-> f_out_jump_w;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00079"  name = "l00079" > < / a > < span  class = "lineno" >    79< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_ow = tid_z % jump_params-> f_out_jump_w;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00080"  name = "l00080" > < / a > < span  class = "lineno" >    80< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00081"  name = "l00081" > < / a > < span  class = "lineno" >    81< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_wh = base_h[base_oh].weight_base;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00082"  name = "l00082" > < / a > < span  class = "lineno" >    82< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_ww = base_w[base_ow].weight_base;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00083"  name = "l00083" > < / a > < span  class = "lineno" >    83< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00084"  name = "l00084" > < / a > < span  class = "lineno" >    84< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_wh_size = base_h[base_oh].weight_size;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00085"  name = "l00085" > < / a > < span  class = "lineno" >    85< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  base_ww_size = base_w[base_ow].weight_size;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00086"  name = "l00086" > < / a > < span  class = "lineno" >    86< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00087"  name = "l00087" > < / a > < span  class = "lineno" >    87< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  c_row = tid_y * BM;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00088"  name = "l00088" > < / a > < span  class = "lineno" >    88< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  c_col = tid_x * BN;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00089"  name = "l00089" > < / a > < span  class = "lineno" >    89< / span >   < span  class = "keyword" > const< / span >  < span  class = "keywordtype" > int< / span >  K = gemm_params-> K;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00090"  name = "l00090" > < / a > < span  class = "lineno" >    90< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00091"  name = "l00091" > < / a > < span  class = "lineno" >    91< / span >   B += c_col * K;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00092"  name = "l00092" > < / a > < span  class = "lineno" >    92< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00093"  name = "l00093" > < / a > < span  class = "lineno" >    93< / span >   < span  class = "keyword" > const< / span >  int4 offsets_a(0, c_row, base_oh, base_ow);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00094"  name = "l00094" > < / a > < span  class = "lineno" >    94< / span >   < span  class = "keyword" > const< / span >  int2 offsets_b(0, c_col);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00095"  name = "l00095" > < / a > < span  class = "lineno" >    95< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00096"  name = "l00096" > < / a > < span  class = "lineno" >    96< / span >   < span  class = "comment" > // Prepare threadgroup loading operations< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00097"  name = "l00097" > < / a > < span  class = "lineno" >    97< / span >   loader_a_t loader_a(< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00098"  name = "l00098" > < / a > < span  class = "lineno" >    98< / span >       A,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00099"  name = "l00099" > < / a > < span  class = "lineno" >    99< / span >       As,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00100"  name = "l00100" > < / a > < span  class = "lineno" >   100< / span >       offsets_a,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00101"  name = "l00101" > < / a > < span  class = "lineno" >   101< / span >       params,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00102"  name = "l00102" > < / a > < span  class = "lineno" >   102< / span >       jump_params,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00103"  name = "l00103" > < / a > < span  class = "lineno" >   103< / span >       base_wh,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00104"  name = "l00104" > < / a > < span  class = "lineno" >   104< / span >       base_ww,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00105"  name = "l00105" > < / a > < span  class = "lineno" >   105< / span >       simd_gid,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00106"  name = "l00106" > < / a > < span  class = "lineno" >   106< / span >       simd_lid);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00107"  name = "l00107" > < / a > < span  class = "lineno" >   107< / span >   loader_b_t loader_b(< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00108"  name = "l00108" > < / a > < span  class = "lineno" >   108< / span >       B,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00109"  name = "l00109" > < / a > < span  class = "lineno" >   109< / span >       Bs,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00110"  name = "l00110" > < / a > < span  class = "lineno" >   110< / span >       offsets_b,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00111"  name = "l00111" > < / a > < span  class = "lineno" >   111< / span >       params,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00112"  name = "l00112" > < / a > < span  class = "lineno" >   112< / span >       jump_params,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00113"  name = "l00113" > < / a > < span  class = "lineno" >   113< / span >       base_wh,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00114"  name = "l00114" > < / a > < span  class = "lineno" >   114< / span >       base_ww,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00115"  name = "l00115" > < / a > < span  class = "lineno" >   115< / span >       simd_gid,< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00116"  name = "l00116" > < / a > < span  class = "lineno" >   116< / span >       simd_lid);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00117"  name = "l00117" > < / a > < span  class = "lineno" >   117< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00118"  name = "l00118" > < / a > < span  class = "lineno" >   118< / span >   < span  class = "comment" > // Prepare threadgroup mma operation< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00119"  name = "l00119" > < / a > < span  class = "lineno" >   119< / span >   mma_t mma_op(simd_gid, simd_lid);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00120"  name = "l00120" > < / a > < span  class = "lineno" >   120< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00121"  name = "l00121" > < / a > < span  class = "lineno" >   121< / span >   < span  class = "keywordtype" > int< / span >  gemm_k_iterations =< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00122"  name = "l00122" > < / a > < span  class = "lineno" >   122< / span >       base_wh_size * base_ww_size * gemm_params-> gemm_k_iterations;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00123"  name = "l00123" > < / a > < span  class = "lineno" >   123< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00124"  name = "l00124" > < / a > < span  class = "lineno" >   124< / span >   < span  class = "keywordflow" > for< / span >  (< span  class = "keywordtype" > int< / span >  k = 0; k <  gemm_k_iterations; k++) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00125"  name = "l00125" > < / a > < span  class = "lineno" >   125< / span >     threadgroup_barrier(mem_flags::mem_threadgroup);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00126"  name = "l00126" > < / a > < span  class = "lineno" >   126< / span >     < span  class = "comment" > // Load elements into threadgroup< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00127"  name = "l00127" > < / a > < span  class = "lineno" >   127< / span >     loader_a.load_unsafe();< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00128"  name = "l00128" > < / a > < span  class = "lineno" >   128< / span >     loader_b.load_unsafe();< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00129"  name = "l00129" > < / a > < span  class = "lineno" >   129< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00130"  name = "l00130" > < / a > < span  class = "lineno" >   130< / span >     threadgroup_barrier(mem_flags::mem_threadgroup);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00131"  name = "l00131" > < / a > < span  class = "lineno" >   131< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00132"  name = "l00132" > < / a > < span  class = "lineno" >   132< / span >     < span  class = "comment" > // Multiply and accumulate threadgroup elements< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00133"  name = "l00133" > < / a > < span  class = "lineno" >   133< / span >     mma_op.mma(As, Bs);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00134"  name = "l00134" > < / a > < span  class = "lineno" >   134< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00135"  name = "l00135" > < / a > < span  class = "lineno" >   135< / span >     < span  class = "comment" > // Prepare for next iteration< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00136"  name = "l00136" > < / a > < span  class = "lineno" >   136< / span >     loader_a.next();< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00137"  name = "l00137" > < / a > < span  class = "lineno" >   137< / span >     loader_b.next();< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00138"  name = "l00138" > < / a > < span  class = "lineno" >   138< / span >   }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00139"  name = "l00139" > < / a > < span  class = "lineno" >   139< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00140"  name = "l00140" > < / a > < span  class = "lineno" >   140< / span >   threadgroup_barrier(mem_flags::mem_none);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00141"  name = "l00141" > < / a > < span  class = "lineno" >   141< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00142"  name = "l00142" > < / a > < span  class = "lineno" >   142< / span >   < span  class = "comment" > // Store results to device memory< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00143"  name = "l00143" > < / a > < span  class = "lineno" >   143< / span >   {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00144"  name = "l00144" > < / a > < span  class = "lineno" >   144< / span >     < span  class = "comment" > // Adjust for simdgroup and thread location< / span > < / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-31 03:00:19 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00145"  name = "l00145" > < / a > < span  class = "lineno" >   145< / span >     < span  class = "keywordtype" > int< / span >  offset_m = c_row + mma_op.sm;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00146"  name = "l00146" > < / a > < span  class = "lineno" >   146< / span >     < span  class = "keywordtype" > int< / span >  offset_n = c_col + mma_op.sn;< / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00147"  name = "l00147" > < / a > < span  class = "lineno" >   147< / span >     C += offset_n;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00148"  name = "l00148" > < / a > < span  class = "lineno" >   148< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00149"  name = "l00149" > < / a > < span  class = "lineno" >   149< / span >     < span  class = "keywordflow" > if< / span >  (offset_n > = gemm_params-> N)< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00150"  name = "l00150" > < / a > < span  class = "lineno" >   150< / span >       < span  class = "keywordflow" > return< / span > ;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00151"  name = "l00151" > < / a > < span  class = "lineno" >   151< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00152"  name = "l00152" > < / a > < span  class = "lineno" >   152< / span >     < span  class = "keywordtype" > short< / span >  diff = gemm_params-> N - offset_n;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00153"  name = "l00153" > < / a > < span  class = "lineno" >   153< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00154"  name = "l00154" > < / a > < span  class = "lineno" >   154< / span >     < a  class = "code hl_define"  href = "steel_2defines_8h.html#a5a5c3095b132a7589bc19cd5cb80e2c6" > STEEL_PRAGMA_UNROLL< / a > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00155"  name = "l00155" > < / a > < span  class = "lineno" >   155< / span >     < span  class = "keywordflow" > for< / span >  (< span  class = "keywordtype" > int< / span >  i = 0; i <  mma_t::TM; i++) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00156"  name = "l00156" > < / a > < span  class = "lineno" >   156< / span >       < span  class = "keywordtype" > int< / span >  cm = offset_m + i * mma_t::TM_stride;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00157"  name = "l00157" > < / a > < span  class = "lineno" >   157< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00158"  name = "l00158" > < / a > < span  class = "lineno" >   158< / span >       < span  class = "keywordtype" > int< / span >  n = cm / jump_params-> adj_out_hw;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00159"  name = "l00159" > < / a > < span  class = "lineno" >   159< / span >       < span  class = "keywordtype" > int< / span >  hw = cm % jump_params-> adj_out_hw;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00160"  name = "l00160" > < / a > < span  class = "lineno" >   160< / span >       < span  class = "keywordtype" > int< / span >  oh =< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00161"  name = "l00161" > < / a > < span  class = "lineno" >   161< / span >           (hw / jump_params-> adj_out_w) * jump_params-> f_out_jump_h + base_oh;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00162"  name = "l00162" > < / a > < span  class = "lineno" >   162< / span >       < span  class = "keywordtype" > int< / span >  ow =< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00163"  name = "l00163" > < / a > < span  class = "lineno" >   163< / span >           (hw % jump_params-> adj_out_w) * jump_params-> f_out_jump_w + base_ow;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00164"  name = "l00164" > < / a > < span  class = "lineno" >   164< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00165"  name = "l00165" > < / a > < span  class = "lineno" >   165< / span >       < span  class = "keywordflow" > if< / span >  (n <  params-> N & &  oh <  params-> oS[0] & &  ow <  params-> oS[1]) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00166"  name = "l00166" > < / a > < span  class = "lineno" >   166< / span >         < span  class = "keywordtype" > int< / span >  offset_cm = n * params-> out_strides[0] +< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00167"  name = "l00167" > < / a > < span  class = "lineno" >   167< / span >             oh * params-> out_strides[1] + ow * params-> out_strides[2];< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00168"  name = "l00168" > < / a > < span  class = "lineno" >   168< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00169"  name = "l00169" > < / a > < span  class = "lineno" >   169< / span >         < a  class = "code hl_define"  href = "steel_2defines_8h.html#a5a5c3095b132a7589bc19cd5cb80e2c6" > STEEL_PRAGMA_UNROLL< / a > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00170"  name = "l00170" > < / a > < span  class = "lineno" >   170< / span >         < span  class = "keywordflow" > for< / span >  (< span  class = "keywordtype" > int< / span >  j = 0; j <  mma_t::TN; j++) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00171"  name = "l00171" > < / a > < span  class = "lineno" >   171< / span >           < span  class = "comment" > // Get accumulated result and associated offset in C< / span > < / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-31 03:00:19 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00172"  name = "l00172" > < / a > < span  class = "lineno" >   172< / span >           thread < span  class = "keyword" > const< / span >  < span  class = "keyword" > auto< / span > &  accum = mma_op.Ctile.frag_at(i, j);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00173"  name = "l00173" > < / a > < span  class = "lineno" >   173< / span >           < span  class = "keywordtype" > int< / span >  offset = offset_cm + (j * mma_t::TN_stride);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00174"  name = "l00174" > < / a > < span  class = "lineno" >   174< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00175"  name = "l00175" > < / a > < span  class = "lineno" >   175< / span >           < span  class = "keyword" > constexpr< / span >  < span  class = "keywordtype" > short< / span >  kelems = < span  class = "keyword" > decltype< / span > (mma_op.Ctile)::kElemsPerFrag;< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00176"  name = "l00176" > < / a > < span  class = "lineno" >   176< / span >  < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00177"  name = "l00177" > < / a > < span  class = "lineno" >   177< / span >           < span  class = "comment" > // Apply epilogue and output C< / span > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00178"  name = "l00178" > < / a > < span  class = "lineno" >   178< / span >           < a  class = "code hl_define"  href = "steel_2defines_8h.html#a5a5c3095b132a7589bc19cd5cb80e2c6" > STEEL_PRAGMA_UNROLL< / a > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00179"  name = "l00179" > < / a > < span  class = "lineno" >   179< / span >           < span  class = "keywordflow" > for< / span >  (< span  class = "keywordtype" > short< / span >  k = 0; k <  kelems; k++) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00180"  name = "l00180" > < / a > < span  class = "lineno" >   180< / span >             < span  class = "keywordflow" > if< / span >  ((j * mma_t::TN_stride + k) <  diff) {< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00181"  name = "l00181" > < / a > < span  class = "lineno" >   181< / span >               C[offset + k] = Epilogue::apply(accum[k]);< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00182"  name = "l00182" > < / a > < span  class = "lineno" >   182< / span >             }< / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00183"  name = "l00183" > < / a > < span  class = "lineno" >   183< / span >           }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00184"  name = "l00184" > < / a > < span  class = "lineno" >   184< / span >         }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00185"  name = "l00185" > < / a > < span  class = "lineno" >   185< / span >       }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00186"  name = "l00186" > < / a > < span  class = "lineno" >   186< / span >     }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00187"  name = "l00187" > < / a > < span  class = "lineno" >   187< / span >   }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "line" > < a  id = "l00188"  name = "l00188" > < / a > < span  class = "lineno" >   188< / span > }< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "ttc"  id = "aloader__general_8h_html" > < div  class = "ttname" > < a  href = "loader__general_8h.html" > loader_general.h< / a > < / div > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "ttc"  id = "asteel_2defines_8h_html_a5a5c3095b132a7589bc19cd5cb80e2c6" > < div  class = "ttname" > < a  href = "steel_2defines_8h.html#a5a5c3095b132a7589bc19cd5cb80e2c6" > STEEL_PRAGMA_UNROLL< / a > < / div > < div  class = "ttdeci" > #define STEEL_PRAGMA_UNROLL< / div > < div  class = "ttdef" > < b > Definition< / b >  defines.h:4< / div > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "ttc"  id = "asteel__conv__general_8h_html_ad620c0656ae92e36dcb4a285d9e790ee" > < div  class = "ttname" > < a  href = "steel__conv__general_8h.html#ad620c0656ae92e36dcb4a285d9e790ee" > implicit_gemm_conv_2d_general< / a > < / div > < div  class = "ttdeci" > void implicit_gemm_conv_2d_general(const device T *A, const device T *B, device T *C, const constant MLXConvParams<  2 >  *params, const constant ImplicitGemmConv2DParams *gemm_params, const constant Conv2DGeneralJumpParams *jump_params, const constant Conv2DGeneralBaseInfo *base_h, const constant Conv2DGeneralBaseInfo *base_w, uint3 tid, uint3 lid, uint simd_gid, uint simd_lid)< / div > < div  class = "ttdef" > < b > Definition< / b >  steel_conv_general.h:15< / div > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  class = "ttc"  id = "astruct_m_l_x_conv_params_html" > < div  class = "ttname" > < a  href = "struct_m_l_x_conv_params.html" > MLXConvParams< / a > < / div > < div  class = "ttdef" > < b > Definition< / b >  params.h:6< / div > < / div > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > <!--  fragment  --> < / div > <!--  contents  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > <!--  doc - content  --> 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								<!--  start footer part  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< div  id = "nav-path"  class = "navpath" > <!--  id is needed for treeview function!  --> 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								  < ul > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								    < li  class = "navelem" > < a  class = "el"  href = "dir_938ab0ecf10b8b860ff766c820f665fd.html" > mlx< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_1d446c9bd3c99228254c9484e0bc5c06.html" > backend< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_d0c977ea65824390717cdb7efc36c157.html" > metal< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_70a37effa88bcbd6b791977fa1e64356.html" > kernels< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_76215a6c54e2b67053e723fc2395583c.html" > steel< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_df9494e83ef22ae6150a0e080d9709ed.html" > conv< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "dir_6379e541ea5051a09bc0e3fdd92fcd3b.html" > kernels< / a > < / li > < li  class = "navelem" > < a  class = "el"  href = "steel__conv__general_8h.html" > steel_conv_general.h< / a > < / li > 
							 
						 
					
						
							
								
									
										
										
										
											2025-02-06 20:16:29 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								    < li  class = "footer" > Generated by < a  href = "https://www.doxygen.org/index.html" > < img  class = "footer"  src = "doxygen.svg"  width = "104"  height = "31"  alt = "doxygen" / > < / a >  1.13.2 < / li > 
							 
						 
					
						
							
								
									
										
										
										
											2025-01-09 21:56:20 +00:00 
										
									 
								 
							 
							
								
									
										 
									 
								
							 
							
								 
							 
							
							
								  < / ul > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / div > 
							 
						 
					
						
							
								
									
										
										
										
											2024-10-15 15:12:17 +00:00 
										
									 
								 
							 
							
								
							 
							
								 
							 
							
							
								< / body > 
							 
						 
					
						
							
								
							 
							
								
							 
							
								 
							 
							
							
								< / html >