mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-03 13:48:30 +00:00
flag and barrier fix for compiler branch MainOpSelV3
This commit is contained in:
@@ -286,7 +286,7 @@ struct BlockwiseGemmXdlops_pipeline_moe_blockscale_bpreshuffle_v3<
|
||||
{
|
||||
__builtin_amdgcn_sched_group_barrier(0x100, ds_read_a_mfma_rate, 0); // DS read
|
||||
}
|
||||
__builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
// __builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
});
|
||||
// __builtin_amdgcn_sched_barrier(0);
|
||||
});
|
||||
@@ -319,7 +319,7 @@ struct BlockwiseGemmXdlops_pipeline_moe_blockscale_bpreshuffle_v3<
|
||||
{
|
||||
__builtin_amdgcn_sched_group_barrier(0x100, ds_read_a_mfma_rate, 0); // DS read
|
||||
}
|
||||
__builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
// __builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
});
|
||||
// __builtin_amdgcn_sched_barrier(0);
|
||||
});
|
||||
@@ -338,7 +338,7 @@ struct BlockwiseGemmXdlops_pipeline_moe_blockscale_bpreshuffle_v3<
|
||||
{
|
||||
__builtin_amdgcn_sched_group_barrier(0x100, ds_read_a_mfma_rate, 0); // DS read
|
||||
}
|
||||
__builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
// __builtin_amdgcn_sched_group_barrier(0x800, 2, 0); // v_pk_fma
|
||||
});
|
||||
// __builtin_amdgcn_sched_barrier(0);
|
||||
});
|
||||
|
||||
Reference in New Issue
Block a user