mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-15 18:42:06 +00:00
Moving code-lines in hstu pipeline
This commit is contained in:
@@ -414,6 +414,8 @@ struct HstuAttentionFwdPipelineQRKSVS
|
||||
|
||||
pcomp_tile = cast_tile<CompDataType>(sacc_tile);
|
||||
|
||||
tile_elementwise_inout(f_silu, pcomp_tile);
|
||||
|
||||
if constexpr(std::is_same_v<VLayout, ck_tile::tensor_layout::gemm::RowMajor>)
|
||||
{
|
||||
auto v_shuffle_tmp = make_static_distributed_tensor<QKVDataType>(
|
||||
@@ -436,10 +438,6 @@ struct HstuAttentionFwdPipelineQRKSVS
|
||||
tile_elementwise_in(v_element_func, v_tile)); // store the prefetch
|
||||
};
|
||||
|
||||
__builtin_amdgcn_sched_barrier(0);
|
||||
|
||||
tile_elementwise_inout(f_silu, pcomp_tile);
|
||||
|
||||
if constexpr(kHasDropout)
|
||||
{
|
||||
auto randval_lds_ptr = reinterpret_cast<char*>(smem_ptr) +
|
||||
|
||||
Reference in New Issue
Block a user