fix transformer decoder post norm LN (#1637)

Author: Awni Hannun
Date: 2024-12-02 07:02:17 -08:00
Committed by: GitHub
Parent: 974bb54ab2
Commit: aa86876813


@@ -238,7 +238,7 @@ class TransformerDecoderLayer(Module):
 
             y = self.cross_attention(y, memory, memory, memory_mask)
             y = self.dropout2(y)
-            x = self.ln1(x + y)
+            x = self.ln2(x + y)
 
             y = self.linear1(x)
             y = self.activation(y)
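
In the post-norm configuration, each of the decoder layer's three residual sub-blocks (self-attention, cross-attention, feed-forward) is normalized by its own LayerNorm. Before this fix, the cross-attention residual sum was passed through ln1 a second time and ln2 was never applied. The following is a minimal sketch of the corrected post-norm path; PostNormDecoderLayer is a hypothetical name used for illustration, dropout is omitted for brevity, and ReLU stands in for the layer's configurable activation.

import mlx.core as mx
import mlx.nn as nn

class PostNormDecoderLayer(nn.Module):
    # Illustrative reimplementation mirroring the fixed post-norm logic.
    def __init__(self, dims: int, num_heads: int, mlp_dims: int):
        super().__init__()
        self.self_attention = nn.MultiHeadAttention(dims, num_heads)
        self.cross_attention = nn.MultiHeadAttention(dims, num_heads)
        self.ln1 = nn.LayerNorm(dims)
        self.ln2 = nn.LayerNorm(dims)
        self.ln3 = nn.LayerNorm(dims)
        self.linear1 = nn.Linear(dims, mlp_dims)
        self.linear2 = nn.Linear(mlp_dims, dims)

    def __call__(self, x, memory, x_mask=None, memory_mask=None):
        # Self-attention sub-block: ln1 normalizes its residual sum.
        y = self.self_attention(x, x, x, x_mask)
        x = self.ln1(x + y)

        # Cross-attention sub-block: ln2 (not ln1) normalizes this sum --
        # reusing ln1 here was the bug this commit fixes.
        y = self.cross_attention(x, memory, memory, memory_mask)
        x = self.ln2(x + y)

        # Feed-forward sub-block: ln3 normalizes the final residual sum.
        y = self.linear2(nn.relu(self.linear1(x)))
        return self.ln3(x + y)

A quick shape check under these assumptions:

x = mx.random.normal((1, 10, 64))       # decoder input
memory = mx.random.normal((1, 12, 64))  # encoder output
layer = PostNormDecoderLayer(64, 8, 256)
print(layer(x, memory).shape)           # (1, 10, 64)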