Fix group/grid dimension mismatch in qmv_no_parallel_m

This commit is contained in:
tianyi 2025-07-22 18:00:42 +08:00
parent b2f0ebe9ee
commit 7df3a2887d

View File

@@ -259,10 +259,10 @@ void qmv_no_parallel_m(
  const Stream& s) {
  int B = out.size() / M / N;
- int bn = 128;
- // int bk = 32;
- MTL::Size group_dims(2, 1, 1);
- MTL::Size grid_dims((N + bn - 1) / bn, 1, B);
+ int bn = 8;
+ int bk = 32;
+ MTL::Size group_dims(bk, 2, 1);
+ MTL::Size grid_dims(1, (N + bn - 1) / bn, B);
  std::string kname;
  kname.reserve(64);