remove lm head if unused (#1324)

This commit is contained in:
Awni Hannun 2025-03-06 15:35:47 -08:00 committed by GitHub
parent 877d2a345b
commit 595f5da146
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -196,9 +196,12 @@ class Model(nn.Module):
def sanitize(self, weights):
    """Return a filtered copy of ``weights`` without entries the model skips.

    Two kinds of entries are dropped:

    * every key containing ``"self_attn.rotary_emb.inv_freq"``;
    * ``"lm_head.weight"``, but only when ``self.args.tie_word_embeddings``
      is truthy.

    Args:
        weights: Mapping of parameter name to value.

    Returns:
        A new dict; the mapping passed in is not modified.
    """
    # Remove unused precomputed rotary freqs
    weights = {
        k: v for k, v in weights.items() if "self_attn.rotary_emb.inv_freq" not in k
    }
    # Remove the lm head weight when embeddings are tied (it is unused then).
    # pop() with a default so a checkpoint lacking the key is not an error.
    if self.args.tie_word_embeddings:
        weights.pop("lm_head.weight", None)
    return weights
@property
def layers(self):