revert to act_fn to silu

This commit is contained in:
Prince Canuma 2024-12-14 16:22:00 +01:00
parent d7c64c621a
commit 5d8b36ce7c

View File

@ -115,7 +115,7 @@ class MLP(nn.Module):
self.down_proj = nn.Linear(hidden_dim, dim, bias=False)
def __call__(self, x):
return self.down_proj(nn.gelu(self.gate_proj(x)) * self.up_proj(x))
return self.down_proj(nn.silu(self.gate_proj(x)) * self.up_proj(x))
class TransformerBlock(nn.Module):