Fix SDPA kernel bug on macOS 13.3 SDK (#805)

* Move SDPA kernel to allocate threadgroup memory statically and allow macOS 13.3 SDK builds

* Style
This commit is contained in:
Jagrit Digani
2024-03-07 10:18:09 -08:00
committed by GitHub
parent b7588fd5d7
commit ec8a4864fa
3 changed files with 6 additions and 5 deletions

View File

@@ -97,8 +97,6 @@ void sdpa_metal(
set_array_buffer(compute_encoder, p_lse, 6);
set_array_buffer(compute_encoder, p_rowmaxes, 7);
constexpr const uint tgroupMemorySize = 32768;
compute_encoder->setThreadgroupMemoryLength(tgroupMemorySize, 0);
compute_encoder->dispatchThreadgroups(grid_dims, group_dims);
{