Merge pull request #102 from burakbudanur/main

Corrected the typo in 'ffn_dim_multiplier' and added 'rope_theta' …
This commit is contained in:
Awni Hannun 2023-12-14 07:12:20 -08:00 committed by GitHub
commit 363108d7b3
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -315,7 +315,7 @@ def load_model(model_path):
config["hidden_dim"] = weights["layers.0.feed_forward.w1.weight"].shape[0]
if config.get("vocab_size", -1) < 0:
config["vocab_size"] = weights["output.weight"].shape[-1]
unused = ["multiple_of", "ffn_dim_multiplie"]
unused = ["multiple_of", "ffn_dim_multiplier", 'rope_theta']
for k in unused:
if k in config:
config.pop(k)