mirror of
https://github.com/ml-explore/mlx.git
synced 2025-09-18 10:26:56 +08:00
docs update
This commit is contained in:

committed by
CircleCI Docs

parent
6e9288a41c
commit
f5dcb1c2b9
131
docs/build/html/quantized_8h.html
vendored
131
docs/build/html/quantized_8h.html
vendored
@@ -127,10 +127,10 @@ Functions</h2></td></tr>
|
||||
<tr class="memitem:a9d466e3e3af0d75cfc4eddcf46cb13e4" id="r_a9d466e3e3af0d75cfc4eddcf46cb13e4"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits> </td></tr>
|
||||
<tr class="memitem:a9d466e3e3af0d75cfc4eddcf46cb13e4"><td class="memTemplItemLeft" align="right" valign="top">METAL_FUNC void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#a9d466e3e3af0d75cfc4eddcf46cb13e4">qvm_impl</a> (const device T *x, const device uint32_t *w, const device T *scales, const device T *biases, device T *y, const constant int &in_vec_size, const constant int &out_vec_size, uint3 tid, uint simd_gid, uint simd_lid)</td></tr>
|
||||
<tr class="separator:a9d466e3e3af0d75cfc4eddcf46cb13e4"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:ac7b6accc41b026ef8efc312987aa9efe" id="r_ac7b6accc41b026ef8efc312987aa9efe"><td class="memTemplParams" colspan="2">template<typename T , const int BM, const int BK, const int BN, const int group_size, const int bits, const bool aligned_N> </td></tr>
|
||||
<tr class="memitem:ac7b6accc41b026ef8efc312987aa9efe" id="r_ac7b6accc41b026ef8efc312987aa9efe"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits, const bool aligned_N, const int BM = 32, const int BK = 32, const int BN = 32> </td></tr>
|
||||
<tr class="memitem:ac7b6accc41b026ef8efc312987aa9efe"><td class="memTemplItemLeft" align="right" valign="top">METAL_FUNC void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#ac7b6accc41b026ef8efc312987aa9efe">qmm_t_impl</a> (const device T *x, const device uint32_t *w, const device T *scales, const device T *biases, device T *y, threadgroup T *Xs, threadgroup T *Ws, const constant int &M, const constant int &N, const constant int &K, uint3 tid, uint lid, uint simd_gid, uint simd_lid)</td></tr>
|
||||
<tr class="separator:ac7b6accc41b026ef8efc312987aa9efe"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a5f7b71eef2e328af3225d7c777ffb339" id="r_a5f7b71eef2e328af3225d7c777ffb339"><td class="memTemplParams" colspan="2">template<typename T , const int BM, const int BK, const int BN, const int group_size, const int bits> </td></tr>
|
||||
<tr class="memitem:a5f7b71eef2e328af3225d7c777ffb339" id="r_a5f7b71eef2e328af3225d7c777ffb339"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits, const int BM = 32, const int BK = 32, const int BN = 32> </td></tr>
|
||||
<tr class="memitem:a5f7b71eef2e328af3225d7c777ffb339"><td class="memTemplItemLeft" align="right" valign="top">METAL_FUNC void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#a5f7b71eef2e328af3225d7c777ffb339">qmm_n_impl</a> (const device T *x, const device uint32_t *w, const device T *scales, const device T *biases, device T *y, threadgroup T *Xs, threadgroup T *Ws, const constant int &M, const constant int &N, const constant int &K, uint3 tid, uint lid, uint simd_gid, uint simd_lid)</td></tr>
|
||||
<tr class="separator:a5f7b71eef2e328af3225d7c777ffb339"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a3ab400746ad77be89c30d25638e01698" id="r_a3ab400746ad77be89c30d25638e01698"><td class="memTemplParams" colspan="2">template<typename T > </td></tr>
|
||||
@@ -166,6 +166,15 @@ Functions</h2></td></tr>
|
||||
<tr class="memitem:acfc43edcf0c742ddc090d22cb7229284" id="r_acfc43edcf0c742ddc090d22cb7229284"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits, const int BM = 32, const int BK = 32, const int BN = 32> </td></tr>
|
||||
<tr class="memitem:acfc43edcf0c742ddc090d22cb7229284"><td class="memTemplItemLeft" align="right" valign="top">void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#acfc43edcf0c742ddc090d22cb7229284">bs_qmm_n</a> (const device T *x, const device uint32_t *w, const device T *scales, const device T *biases, const device uint32_t *lhs_indices, const device uint32_t *rhs_indices, device T *y, const constant int &M, const constant int &N, const constant int &K, const constant int &batch_ndims, const constant int *batch_shape, const constant size_t *lhs_strides, const constant size_t *rhs_strides, const constant int &x_batch_ndims, const constant int *x_shape, const constant size_t *x_strides, const constant int &w_batch_ndims, const constant int *w_shape, const constant size_t *w_strides, const constant size_t *s_strides, const constant size_t *b_strides, uint3 tid, uint lid, uint simd_gid, uint simd_lid)</td></tr>
|
||||
<tr class="separator:acfc43edcf0c742ddc090d22cb7229284"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a47610f886f988d84c3e789eb564a6c44" id="r_a47610f886f988d84c3e789eb564a6c44"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits> </td></tr>
|
||||
<tr class="memitem:a47610f886f988d84c3e789eb564a6c44"><td class="memTemplItemLeft" align="right" valign="top">void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#a47610f886f988d84c3e789eb564a6c44">affine_quantize</a> (const device T *w, device uint8_t *out, device T *scales, device T *biases, uint index)</td></tr>
|
||||
<tr class="separator:a47610f886f988d84c3e789eb564a6c44"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:a57cd320aab5fa1abb65f79b0b781f575" id="r_a57cd320aab5fa1abb65f79b0b781f575"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits> </td></tr>
|
||||
<tr class="memitem:a57cd320aab5fa1abb65f79b0b781f575"><td class="memTemplItemLeft" align="right" valign="top">void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#a57cd320aab5fa1abb65f79b0b781f575">affine_quantize_scales_biases</a> (const device T *w, const device T *scales, const device T *biases, device uint8_t *out, uint index)</td></tr>
|
||||
<tr class="separator:a57cd320aab5fa1abb65f79b0b781f575"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
<tr class="memitem:aecc3db76dcae742776e71ec8fca470c5" id="r_aecc3db76dcae742776e71ec8fca470c5"><td class="memTemplParams" colspan="2">template<typename T , const int group_size, const int bits> </td></tr>
|
||||
<tr class="memitem:aecc3db76dcae742776e71ec8fca470c5"><td class="memTemplItemLeft" align="right" valign="top">void </td><td class="memTemplItemRight" valign="bottom"><a class="el" href="#aecc3db76dcae742776e71ec8fca470c5">affine_dequantize</a> (const device uint8_t *w, const device T *scales, const device T *biases, device T *out, uint index)</td></tr>
|
||||
<tr class="separator:aecc3db76dcae742776e71ec8fca470c5"><td class="memSeparator" colspan="2"> </td></tr>
|
||||
</table><table class="memberdecls">
|
||||
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a id="var-members" name="var-members"></a>
|
||||
Variables</h2></td></tr>
|
||||
@@ -304,6 +313,120 @@ template<typename T > </div>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="aecc3db76dcae742776e71ec8fca470c5" name="aecc3db76dcae742776e71ec8fca470c5"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#aecc3db76dcae742776e71ec8fca470c5">◆ </a></span>affine_dequantize()</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , const int group_size, const int bits> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">void affine_dequantize </td>
|
||||
<td>(</td>
|
||||
<td class="paramtype">const device uint8_t *</td> <td class="paramname"><span class="paramname"><em>w</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>scales</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>biases</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">device T *</td> <td class="paramname"><span class="paramname"><em>out</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">uint</td> <td class="paramname"><span class="paramname"><em>index</em></span> )</td>
|
||||
</tr>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="a47610f886f988d84c3e789eb564a6c44" name="a47610f886f988d84c3e789eb564a6c44"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#a47610f886f988d84c3e789eb564a6c44">◆ </a></span>affine_quantize()</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , const int group_size, const int bits> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">void affine_quantize </td>
|
||||
<td>(</td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>w</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">device uint8_t *</td> <td class="paramname"><span class="paramname"><em>out</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">device T *</td> <td class="paramname"><span class="paramname"><em>scales</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">device T *</td> <td class="paramname"><span class="paramname"><em>biases</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">uint</td> <td class="paramname"><span class="paramname"><em>index</em></span> )</td>
|
||||
</tr>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="a57cd320aab5fa1abb65f79b0b781f575" name="a57cd320aab5fa1abb65f79b0b781f575"></a>
|
||||
<h2 class="memtitle"><span class="permalink"><a href="#a57cd320aab5fa1abb65f79b0b781f575">◆ </a></span>affine_quantize_scales_biases()</h2>
|
||||
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , const int group_size, const int bits> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">void affine_quantize_scales_biases </td>
|
||||
<td>(</td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>w</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>scales</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">const device T *</td> <td class="paramname"><span class="paramname"><em>biases</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">device uint8_t *</td> <td class="paramname"><span class="paramname"><em>out</em>, </span></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="paramkey"></td>
|
||||
<td></td>
|
||||
<td class="paramtype">uint</td> <td class="paramname"><span class="paramname"><em>index</em></span> )</td>
|
||||
</tr>
|
||||
</table>
|
||||
</div><div class="memdoc">
|
||||
|
||||
</div>
|
||||
</div>
|
||||
<a id="acfc43edcf0c742ddc090d22cb7229284" name="acfc43edcf0c742ddc090d22cb7229284"></a>
|
||||
@@ -1275,7 +1398,7 @@ template<typename T , const int group_size, const int bits, const int BM = 32
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , const int BM, const int BK, const int BN, const int group_size, const int bits> </div>
|
||||
template<typename T , const int group_size, const int bits, const int BM = 32, const int BK = 32, const int BN = 32> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">METAL_FUNC void qmm_n_impl </td>
|
||||
@@ -1431,7 +1554,7 @@ template<typename T , const int group_size, const int bits, const bool aligne
|
||||
<div class="memitem">
|
||||
<div class="memproto">
|
||||
<div class="memtemplate">
|
||||
template<typename T , const int BM, const int BK, const int BN, const int group_size, const int bits, const bool aligned_N> </div>
|
||||
template<typename T , const int group_size, const int bits, const bool aligned_N, const int BM = 32, const int BK = 32, const int BN = 32> </div>
|
||||
<table class="memname">
|
||||
<tr>
|
||||
<td class="memname">METAL_FUNC void qmm_t_impl </td>
|
||||
|
Reference in New Issue
Block a user