Merge commit 'b7a806f2442ed04db9e835e3e4e14aaebe3db9b4' into develop

This commit is contained in:
assistant-librarian[bot]
2025-09-16 16:13:22 +00:00
parent 1191876ea6
commit 0daa4023fc
16 changed files with 203 additions and 96 deletions

View File

@@ -82,7 +82,11 @@ struct Smoothquant
return dim3(integer_divide_ceil(hargs.m, Block_M));
}
// Host-side query for the launch block size: forwards the BlockSize constant
// published by Problem::BlockShape without modification.
CK_TILE_HOST static constexpr auto BlockSize()
{
    const auto threads_per_block = Problem::BlockShape::BlockSize;
    return threads_per_block;
}
// Host-side query for the launch block size.
// Calls Problem::BlockShape::GetBlockSize<B>() with B equal to the result of
// is_wave32(); the <true> variant is used when is_wave32() reports true, the
// <false> variant otherwise.
// NOTE(review): presumably is_wave32() reflects the wavefront width of the
// target device -- confirm against its definition.
CK_TILE_HOST static constexpr auto BlockSize()
{
    using Shape = typename Problem::BlockShape;

    const bool wave32 = is_wave32();
    // Keep both alternatives in one conditional expression so the deduced
    // return type is formed exactly as before.
    return wave32 ? Shape::template GetBlockSize<true>() : Shape::template GetBlockSize<false>();
}
// clang-format off
template <typename T> struct t2s;