Merge commit 'c7dce2ac29136939b6fe6aabadd026e53dcf35c9' into develop

This commit is contained in:
assistant-librarian[bot]
2025-11-26 02:44:11 +00:00
parent 6d42c1d821
commit 9eb4b35ef6
3 changed files with 74 additions and 25 deletions

View File

@@ -229,13 +229,13 @@ struct UniversalFlatmmPipelineAgBgCrPolicy
template <typename Problem>
CK_TILE_HOST_DEVICE static constexpr index_t GetSmemPackA()
{
-using A = remove_cvref_t<typename Problem::ADataType>;
-using BlockGemm = remove_cvref_t<decltype(GetBlockGemm<Problem>())>;
+using A = remove_cvref_t<typename Problem::ADataType>;
+using BlockFlatmm = remove_cvref_t<decltype(GetBlockFlatmm<Problem>())>;
-constexpr index_t KPack = static_cast<index_t>(BlockGemm::Traits::KPack);
-constexpr index_t VecElems = static_cast<index_t>(Problem::VectorLoadSize / sizeof(A));
+constexpr index_t KPack = BlockFlatmm::BlockPolicy::WarpGemm::kKPerThread;
+constexpr index_t VecElems = Problem::VectorLoadSize / sizeof(A);
-return (KPack < VecElems) ? KPack : VecElems;
+return min(KPack, VecElems);
}
template <typename Problem>