mirror of
https://github.com/ml-explore/mlx.git
synced 2025-09-18 18:28:12 +08:00
rebase
This commit is contained in:
@@ -97,8 +97,8 @@ $(function(){ initResizable(false); });
|
||||
<table class="memberdecls">
|
||||
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a id="pub-methods" name="pub-methods"></a>
|
||||
Public Member Functions</h2></td></tr>
|
||||
<tr class="memitem:af59b054750a65e7e79c1cd05c4acac93" id="r_af59b054750a65e7e79c1cd05c4acac93"><td class="memItemLeft" align="right" valign="top"> </td><td class="memItemRight" valign="bottom"><a class="el" href="#af59b054750a65e7e79c1cd05c4acac93">QuantizedBlockLoader</a> (const device uint32_t *src_, const device T *scales_, const device T *biases_, const int src_ld_, threadgroup T *dst_, ushort simd_group_id, ushort simd_lane_id)</td></tr>
|
||||
<tr class="separator:af59b054750a65e7e79c1cd05c4acac93"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a60713ce7498aa683cbb2a0f19ab16589" id="r_a60713ce7498aa683cbb2a0f19ab16589"><td class="memItemLeft" align="right" valign="top"> </td><td class="memItemRight" valign="bottom"><a class="el" href="#a60713ce7498aa683cbb2a0f19ab16589">QuantizedBlockLoader</a> (const device uint8_t *src_, const device T *scales_, const device T *biases_, const int src_ld_, threadgroup T *dst_, ushort simd_group_id, ushort simd_lane_id)</td></tr>
|
||||
<tr class="separator:a60713ce7498aa683cbb2a0f19ab16589"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a86009527cb4b53e4c21fd6b1f78cfefc" id="r_a86009527cb4b53e4c21fd6b1f78cfefc"><td class="memItemLeft" align="right" valign="top">void </td><td class="memItemRight" valign="bottom"><a class="el" href="#a86009527cb4b53e4c21fd6b1f78cfefc">load_unsafe</a> () const</td></tr>
|
||||
<tr class="separator:a86009527cb4b53e4c21fd6b1f78cfefc"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a699dc9aa284b8fbf870310bbb224465b" id="r_a699dc9aa284b8fbf870310bbb224465b"><td class="memItemLeft" align="right" valign="top">void </td><td class="memItemRight" valign="bottom"><a class="el" href="#a699dc9aa284b8fbf870310bbb224465b">load_safe</a> (short2 src_tile_dim) const</td></tr>
|
||||
@@ -124,8 +124,8 @@ Public Attributes</h2></td></tr>
|
||||
<tr class="separator:ae2add92b2aaf3414e91f0470b9b0cc00"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a9857214690fe6abad0e19d1045152f83" id="r_a9857214690fe6abad0e19d1045152f83"><td class="memItemLeft" align="right" valign="top">threadgroup T * </td><td class="memItemRight" valign="bottom"><a class="el" href="#a9857214690fe6abad0e19d1045152f83">dst</a></td></tr>
|
||||
<tr class="separator:a9857214690fe6abad0e19d1045152f83"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:ad85c6b7e07c81307b3b91eb4dd7be30b" id="r_ad85c6b7e07c81307b3b91eb4dd7be30b"><td class="memItemLeft" align="right" valign="top">const device uint32_t * </td><td class="memItemRight" valign="bottom"><a class="el" href="#ad85c6b7e07c81307b3b91eb4dd7be30b">src</a></td></tr>
|
||||
<tr class="separator:ad85c6b7e07c81307b3b91eb4dd7be30b"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:abbf8249ca99e3e87b296ddd60a984b76" id="r_abbf8249ca99e3e87b296ddd60a984b76"><td class="memItemLeft" align="right" valign="top">const device uint8_t * </td><td class="memItemRight" valign="bottom"><a class="el" href="#abbf8249ca99e3e87b296ddd60a984b76">src</a></td></tr>
|
||||
<tr class="separator:abbf8249ca99e3e87b296ddd60a984b76"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a6123e4a9209d6eacb58b2c2344ed1ecf" id="r_a6123e4a9209d6eacb58b2c2344ed1ecf"><td class="memItemLeft" align="right" valign="top">const device T * </td><td class="memItemRight" valign="bottom"><a class="el" href="#a6123e4a9209d6eacb58b2c2344ed1ecf">scales</a></td></tr>
|
||||
<tr class="separator:a6123e4a9209d6eacb58b2c2344ed1ecf"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a17d01a6aba0833b073586ef2c09d0fbd" id="r_a17d01a6aba0833b073586ef2c09d0fbd"><td class="memItemLeft" align="right" valign="top">const device T * </td><td class="memItemRight" valign="bottom"><a class="el" href="#a17d01a6aba0833b073586ef2c09d0fbd">biases</a></td></tr>
|
||||
@@ -133,8 +133,10 @@ Public Attributes</h2></td></tr>
|
||||
</table><table class="memberdecls">
|
||||
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a id="pub-static-attribs" name="pub-static-attribs"></a>
|
||||
Static Public Attributes</h2></td></tr>
|
||||
<tr class="memitem:a8eae73a0c04bf1e41fb96131f6aa500d" id="r_a8eae73a0c04bf1e41fb96131f6aa500d"><td class="memItemLeft" align="right" valign="top">static constant constexpr const short </td><td class="memItemRight" valign="bottom"><a class="el" href="#a8eae73a0c04bf1e41fb96131f6aa500d">pack_factor</a> = 32 / bits</td></tr>
|
||||
<tr class="memitem:a8eae73a0c04bf1e41fb96131f6aa500d" id="r_a8eae73a0c04bf1e41fb96131f6aa500d"><td class="memItemLeft" align="right" valign="top">static constant constexpr const short </td><td class="memItemRight" valign="bottom"><a class="el" href="#a8eae73a0c04bf1e41fb96131f6aa500d">pack_factor</a> = bits == 3 ? 8 : bits == 6 ? 4 : 8 / bits</td></tr>
|
||||
<tr class="separator:a8eae73a0c04bf1e41fb96131f6aa500d"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:ad00fe6d8bd395206a41693a8ed65d4db" id="r_ad00fe6d8bd395206a41693a8ed65d4db"><td class="memItemLeft" align="right" valign="top">static constant constexpr const short </td><td class="memItemRight" valign="bottom"><a class="el" href="#ad00fe6d8bd395206a41693a8ed65d4db">bytes_per_pack</a> = (bits == 3 || bits == 6) ? 3 : 1</td></tr>
|
||||
<tr class="separator:ad00fe6d8bd395206a41693a8ed65d4db"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a1392a5278cf6e090ea80ebe7c4ac5fbb" id="r_a1392a5278cf6e090ea80ebe7c4ac5fbb"><td class="memItemLeft" align="right" valign="top">static constant constexpr const short </td><td class="memItemRight" valign="bottom"><a class="el" href="#a1392a5278cf6e090ea80ebe7c4ac5fbb">BCOLS_PACKED</a> = BCOLS / <a class="el" href="#a8eae73a0c04bf1e41fb96131f6aa500d">pack_factor</a></td></tr>
|
||||
<tr class="separator:a1392a5278cf6e090ea80ebe7c4ac5fbb"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a6213479f7a6d9314d8879f8856b0b6fb" id="r_a6213479f7a6d9314d8879f8856b0b6fb"><td class="memItemLeft" align="right" valign="top">static constant constexpr const short </td><td class="memItemRight" valign="bottom"><a class="el" href="#a6213479f7a6d9314d8879f8856b0b6fb">n_reads</a></td></tr>
|
||||
@@ -143,8 +145,8 @@ Static Public Attributes</h2></td></tr>
|
||||
<tr class="separator:a31e14175f3d4902d9fe5ab5a219f61ba"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
</table>
|
||||
<h2 class="groupheader">Constructor & Destructor Documentation</h2>
|
||||
<a id="af59b054750a65e7e79c1cd05c4acac93" name="af59b054750a65e7e79c1cd05c4acac93"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#af59b054750a65e7e79c1cd05c4acac93">◆ </a></span>QuantizedBlockLoader()</h2>
|
||||
<a id="a60713ce7498aa683cbb2a0f19ab16589" name="a60713ce7498aa683cbb2a0f19ab16589"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#a60713ce7498aa683cbb2a0f19ab16589">◆ </a></span>QuantizedBlockLoader()</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
@@ -157,7 +159,7 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
<tr>
|
||||
<td class="memname"><a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits ><a class="el" href="struct_quantized_block_loader.html">::QuantizedBlockLoader</a> </td>
|
||||
<td>(</td>
|
||||
<td class="paramtype">const device uint32_t *</td> <td class="paramname"><span class="paramname"><em>src_</em></span>, </td>
|
||||
<td class="paramtype">const device uint8_t *</td> <td class="paramname"><span class="paramname"><em>src_</em></span>, </td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
@@ -352,6 +354,30 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="ad00fe6d8bd395206a41693a8ed65d4db" name="ad00fe6d8bd395206a41693a8ed65d4db"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#ad00fe6d8bd395206a41693a8ed65d4db">◆ </a></span>bytes_per_pack</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction_dim, short tgp_size, short group_size, short bits> </div>
|
||||
<table class="mlabels">
|
||||
<tr>
|
||||
<td class="mlabels-left">
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">constant constexpr const short <a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits >::bytes_per_pack = (bits == 3 || bits == 6) ? 3 : 1</td>
|
||||
</tr>
|
||||
</table>
|
||||
</td>
|
||||
<td class="mlabels-right">
|
||||
<span class="mlabels"><span class="mlabel">static</span><span class="mlabel">constexpr</span></span> </td>
|
||||
</tr>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="a9857214690fe6abad0e19d1045152f83" name="a9857214690fe6abad0e19d1045152f83"></a>
|
||||
@@ -449,7 +475,7 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
</div><div class="memdoc">
|
||||
<b>Initial value:</b><div class="fragment"><div class="line">=</div>
|
||||
<div class="line"> (<a class="code hl_variable" href="#a1392a5278cf6e090ea80ebe7c4ac5fbb">BCOLS_PACKED</a> * BROWS < tgp_size) ? 1 : (<a class="code hl_variable" href="#a1392a5278cf6e090ea80ebe7c4ac5fbb">BCOLS_PACKED</a> * BROWS) / tgp_size</div>
|
||||
<div class="ttc" id="astruct_quantized_block_loader_html_a1392a5278cf6e090ea80ebe7c4ac5fbb"><div class="ttname"><a href="#a1392a5278cf6e090ea80ebe7c4ac5fbb">QuantizedBlockLoader::BCOLS_PACKED</a></div><div class="ttdeci">static constant constexpr const short BCOLS_PACKED</div><div class="ttdef"><b>Definition</b> quantized.h:274</div></div>
|
||||
<div class="ttc" id="astruct_quantized_block_loader_html_a1392a5278cf6e090ea80ebe7c4ac5fbb"><div class="ttname"><a href="#a1392a5278cf6e090ea80ebe7c4ac5fbb">QuantizedBlockLoader::BCOLS_PACKED</a></div><div class="ttdeci">static constant constexpr const short BCOLS_PACKED</div><div class="ttdef"><b>Definition</b> quantized.h:456</div></div>
|
||||
</div><!-- fragment -->
|
||||
</div>
|
||||
</div>
|
||||
@@ -465,7 +491,7 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
<td class="mlabels-left">
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">constant constexpr const short <a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits >::pack_factor = 32 / bits</td>
|
||||
<td class="memname">constant constexpr const short <a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits >::pack_factor = bits == 3 ? 8 : bits == 6 ? 4 : 8 / bits</td>
|
||||
</tr>
|
||||
</table>
|
||||
</td>
|
||||
@@ -493,8 +519,8 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="ad85c6b7e07c81307b3b91eb4dd7be30b" name="ad85c6b7e07c81307b3b91eb4dd7be30b"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#ad85c6b7e07c81307b3b91eb4dd7be30b">◆ </a></span>src</h2>
|
||||
<a id="abbf8249ca99e3e87b296ddd60a984b76" name="abbf8249ca99e3e87b296ddd60a984b76"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#abbf8249ca99e3e87b296ddd60a984b76">◆ </a></span>src</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
@@ -502,7 +528,7 @@ template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction
|
||||
template<typename T , short BROWS, short BCOLS, short dst_ld, short reduction_dim, short tgp_size, short group_size, short bits> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">const device uint32_t* <a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits >::src</td>
|
||||
<td class="memname">const device uint8_t* <a class="el" href="struct_quantized_block_loader.html">QuantizedBlockLoader</a>< T, BROWS, BCOLS, dst_ld, reduction_dim, tgp_size, group_size, bits >::src</td>
|
||||
</tr>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
Reference in New Issue
Block a user