Disable head dimension 128 (hd=128) in the full SDPA kernel path until further optimizations

This commit is contained in:
Jagrit Digani 2024-11-21 11:21:38 -08:00
parent 990b1acc75
commit 0404037ea6

View File

@@ -644,7 +644,7 @@ array scaled_dot_product_attention(
   const bool sdpa_vector_supported_head_dim =
       query_head_dim == 64 || query_head_dim == 96 || query_head_dim == 128;
   const bool sdpa_full_supported_head_dim =
-      query_head_dim == 64 || query_head_dim == 80 || query_head_dim == 128;
+      query_head_dim == 64 || query_head_dim == 80;
   const bool supports_sdpa_full = query_sequence_length >= threshold &&
       !mask.has_value() && sdpa_full_supported_head_dim &&