mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-03 05:01:25 +00:00
fix mxfp8-gemm example failure (#3531)
Co-authored-by: ZheWang <zhewan@amd.com>
This commit is contained in:
@@ -331,10 +331,15 @@ struct CShuffleEpilogue
|
||||
}
|
||||
else
|
||||
{
|
||||
#if defined(__gfx950__)
|
||||
constexpr auto is_950 = true;
|
||||
#else
|
||||
constexpr auto is_950 = false;
|
||||
#endif
|
||||
constexpr int RakedXDLN_PerWarp = NumNXdlPerWavePerShuffle / BlockedXDLN_PerWarp;
|
||||
// BlockedLayout
|
||||
// this branch is for original a16w4
|
||||
if constexpr(is_any_of<ADataType, pk_int4_t, pk_fp4_t>::value ||
|
||||
if constexpr(is_950 || is_any_of<ADataType, pk_int4_t, pk_fp4_t>::value ||
|
||||
is_any_of<BDataType, pk_int4_t, pk_fp4_t>::value)
|
||||
{
|
||||
return tile_distribution_encoding<
|
||||
|
||||
Reference in New Issue
Block a user