* dbrx

* format

* format

* comments

* change scores slightly

* remove inadvertent import
This commit is contained in:
Awni Hannun
2024-03-28 21:03:53 -07:00
committed by GitHub
parent 297a908e3d
commit b80adbcc3e
4 changed files with 259 additions and 3 deletions

View File

@@ -60,6 +60,8 @@ def linear_to_lora_layers(
keys = set(["att_proj"])
elif model.model_type == "phi-msft":
keys = set(["mixer.Wqkv", "moe.gate"])
elif model.model_type == "dbrx":
keys = set(["norm_attn_norm.attn.Wqkv", "ffn.router.layer"])
else:
raise ValueError(f"Lora does not support {model.model_type}")