mirror of
https://github.com/ml-explore/mlx-examples.git
synced 2025-09-02 05:04:37 +08:00
Hub: Update quantization configuration fields
This commit is contained in:
@@ -646,7 +646,7 @@ def quantize_model(
|
||||
"""
|
||||
quantized_config = copy.deepcopy(config)
|
||||
nn.quantize(model, q_group_size, q_bits)
|
||||
- quantized_config["quantization"] = {"group_size": q_group_size, "bits": q_bits}
|
||||
+ quantized_config["quantization_config"] = {"group_size": q_group_size, "bits": q_bits}
|
||||
quantized_weights = dict(tree_flatten(model.parameters()))
|
||||
|
||||
return quantized_weights, quantized_config
|
||||
|
Reference in New Issue
Block a user