This commit is contained in:
Alex Barron 2024-10-31 12:06:34 -07:00
parent 2e0690374e
commit 1d53354b51
2 changed files with 2 additions and 2 deletions

View File

@@ -191,7 +191,7 @@ class Attention(nn.Module):
keys = self.rope(keys)
output = scaled_dot_product_attention(
-queries, keys, values, cache=cache, cache=cache, scale=self.scale, mask=mask
+queries, keys, values, cache=cache, scale=self.scale, mask=mask
)
output = output.transpose(0, 2, 1, 3).reshape(B, L, -1)

View File

@@ -90,7 +90,7 @@ class Attention(nn.Module):
keys = self.rope(keys)
output = scaled_dot_product_attention(
-queries, keys, values, cache=cache, cache=cache, scale=self.scale, mask=mask
+queries, keys, values, cache=cache, scale=self.scale, mask=mask
)
output = output.transpose(0, 2, 1, 3).reshape(B, L, -1)
return self.o_proj(output)