mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-02 21:27:45 +00:00
debugging warp-level gemm classes
This commit is contained in:
@@ -320,6 +320,17 @@ struct GfxConfig
|
||||
return Gfx90x::kCM0PerLane;
|
||||
}
|
||||
}
|
||||
// Selects the kCM1PerLane constant for the architecture identified by GfxId.
//
// Returns Gfx120x::kCM1PerLane when GfxId == 1200 and Gfx90x::kCM1PerLane when
// GfxId == 900. Any other GfxId is rejected at compile time; previously such a
// value fell off the end of the function without returning anything, which
// shows up as an obscure "not a constant expression" error (or undefined
// behaviour when called at runtime).
//
// NOTE(review): assumes GfxId is the non-type template parameter of the
// enclosing GfxConfig struct, so the static_assert below is only evaluated
// when this member is instantiated for a concrete GfxId -- confirm.
static constexpr index_t get_k_cm1_per_lane()
{
    if constexpr(GfxId == 1200)
    {
        return Gfx120x::kCM1PerLane;
    }
    else if constexpr(GfxId == 900)
    {
        return Gfx90x::kCM1PerLane;
    }
    else
    {
        // The condition depends on GfxId, so it fires only for an
        // unsupported instantiation that actually uses this function.
        static_assert(GfxId == 1200 || GfxId == 900,
                      "get_k_cm1_per_lane(): unsupported GfxId (expected 1200 or 900)");
    }
}
|
||||
};
|
||||
|
||||
} // namespace ck_tile
|
||||
|
||||
@@ -91,7 +91,7 @@ struct WarpGemmAttributeGenericImplF16F16F32M16N16K16
|
||||
static constexpr index_t kCMLane = GfxConfig<GfxId>::get_k_cm_lane();
|
||||
static constexpr index_t kCNLane = 16;
|
||||
static constexpr index_t kCM0PerLane = GfxConfig<GfxId>::get_k_cm0_per_lane();
|
||||
static constexpr index_t kCM1PerLane = 4;
|
||||
static constexpr index_t kCM1PerLane = GfxConfig<GfxId>::get_k_cm1_per_lane();
|
||||
|
||||
// c_vec += a_vec * b_vec
|
||||
template <bool post_nop_ = false>
|
||||
|
||||
Reference in New Issue
Block a user