mirror of
https://github.com/ml-explore/mlx.git
synced 2025-12-16 01:49:05 +08:00
Add mode parameter for quantization (#2499)
* add mode parameter for quantization
* mxfp4 quantize/dequantize + start of optional biases
* mxfp4 works
* speedup
* cpu mxfp4
* fix
* fix test tol
* fix
* refactor
* add quant mode enum
This commit is contained in:
@@ -335,7 +335,7 @@ struct PrimitiveFactory {
|
||||
SERIALIZE_PRIMITIVE(Cholesky),
|
||||
SERIALIZE_PRIMITIVE(Eig),
|
||||
SERIALIZE_PRIMITIVE(Eigh),
|
||||
SERIALIZE_PRIMITIVE(AffineQuantize),
|
||||
SERIALIZE_PRIMITIVE(Quantize),
|
||||
SERIALIZE_PRIMITIVE(RMSNorm),
|
||||
SERIALIZE_PRIMITIVE(RMSNormVJP),
|
||||
SERIALIZE_PRIMITIVE(LayerNorm),
|
||||
|
||||
Reference in New Issue
Block a user