mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 14:29:05 +00:00
Fix merge mfma_wmma (part 1) regression (#2749)
Root cause: a typo in GetGfx11InputBlkIdx — `const` was added by mistake to the declaration of laneId, which the SwizzleA branch reassigns.
This commit is contained in:
@@ -1937,7 +1937,7 @@ struct XdlopsGemm
|
||||
template <bool SwizzleA>
|
||||
__device__ static auto GetGfx11InputBlkIdx()
|
||||
{
|
||||
const auto laneId = GetLaneId() % mfma_instr.num_threads_per_blk;
|
||||
auto laneId = GetLaneId() % mfma_instr.num_threads_per_blk;
|
||||
if constexpr(SwizzleA)
|
||||
{
|
||||
laneId = ((laneId & 1) << 3) | (laneId >> 1);
|
||||
|
||||
Reference in New Issue
Block a user