Hub: Update quantization configuration fields

This commit is contained in:
madroid
2024-08-27 15:04:19 +08:00
parent bf21789b17
commit 8cdc91a92e

View File

@@ -646,7 +646,7 @@ def quantize_model(
"""
quantized_config = copy.deepcopy(config)
nn.quantize(model, q_group_size, q_bits)
quantized_config["quantization"] = {"group_size": q_group_size, "bits": q_bits}
quantized_config["quantization_config"] = {"group_size": q_group_size, "bits": q_bits}
quantized_weights = dict(tree_flatten(model.parameters()))
return quantized_weights, quantized_config