mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-17 03:19:48 +00:00
Merge commit 'de6a9590abe907283e189abba1b487f8e5562d1b' into develop
This commit is contained in:
10
include/ck_tile/ops/flatmm/pipeline/flatmm_pipeline_agmem_bgmem_creg_v1_policy.hpp
Normal file → Executable file
10
include/ck_tile/ops/flatmm/pipeline/flatmm_pipeline_agmem_bgmem_creg_v1_policy.hpp
Normal file → Executable file
@@ -227,9 +227,15 @@ struct UniversalFlatmmPipelineAgBgCrPolicy
     }
 
     template <typename Problem>
-    CK_TILE_HOST_DEVICE static constexpr auto GetSmemPackA()
+    CK_TILE_HOST_DEVICE static constexpr index_t GetSmemPackA()
     {
-        return Problem::VectorLoadSize / sizeof(typename Problem::ADataType);
+        using A = remove_cvref_t<typename Problem::ADataType>;
+        using BlockGemm = remove_cvref_t<decltype(GetBlockGemm<Problem>())>;
+
+        constexpr index_t KPack = static_cast<index_t>(BlockGemm::Traits::KPack);
+        constexpr index_t VecElems = static_cast<index_t>(Problem::VectorLoadSize / sizeof(A));
+
+        return (KPack < VecElems) ? KPack : VecElems;
     }
 
     template <typename Problem>
Reference in New Issue
Block a user