mirror of
https://github.com/ml-explore/mlx.git
synced 2025-08-02 16:56:46 +08:00
Disable hd=128 until further optimizations
This commit is contained in:
parent
990b1acc75
commit
0404037ea6
@@ -644,7 +644,7 @@ array scaled_dot_product_attention(
|
||||
const bool sdpa_vector_supported_head_dim =
|
||||
query_head_dim == 64 || query_head_dim == 96 || query_head_dim == 128;
|
||||
const bool sdpa_full_supported_head_dim =
|
||||
- query_head_dim == 64 || query_head_dim == 80 || query_head_dim == 128;
|
||||
+ query_head_dim == 64 || query_head_dim == 80;
|
||||
|
||||
const bool supports_sdpa_full = query_sequence_length >= threshold &&
|
||||
!mask.has_value() && sdpa_full_supported_head_dim &&
|
||||
|
Loading…
Reference in New Issue
Block a user