Add support for phi-3 (#712)

* Add phi-3 modelling

* Fix RoPE scaling warning

* Add tests and update tuner utils

* Update name and remove sanitize

* Fix LoRA
This commit is contained in:
Prince Canuma
2024-04-23 18:20:00 +02:00
committed by GitHub
parent ecbc6ff1e3
commit abcd891851
3 changed files with 208 additions and 0 deletions

View File

@@ -86,6 +86,8 @@ def linear_to_lora_layers(
keys.add("mlp.shared_expert_gate")
elif model.model_type == "olmo":
keys = set(["att_proj"])
elif model.model_type == "phi3":
keys = set(["self_attn.qkv_proj"])
elif model.model_type == "phi-msft":
keys = set(["mixer.Wqkv", "moe.gate"])
elif model.model_type == "dbrx":