mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-16 02:54:21 +00:00
Merge commit '95e4a4efcb967b806dbad401c79c31abb7ffed47' into develop
This commit is contained in:
@@ -1937,7 +1937,7 @@ struct XdlopsGemm
|
||||
template <bool SwizzleA>
|
||||
__device__ static auto GetGfx11InputBlkIdx()
|
||||
{
|
||||
const auto laneId = GetLaneId() % mfma_instr.num_threads_per_blk;
|
||||
auto laneId = GetLaneId() % mfma_instr.num_threads_per_blk;
|
||||
if constexpr(SwizzleA)
|
||||
{
|
||||
laneId = ((laneId & 1) << 3) | (laneId >> 1);
|
||||
|
||||
Reference in New Issue
Block a user