Remove useless code in the two trload pipelines

This commit is contained in:
Qianfeng Zhang
2025-11-15 13:48:00 +00:00
parent 238b5c4f08
commit b75077475b
2 changed files with 2 additions and 18 deletions

View File

@@ -70,9 +70,6 @@ struct HstuAttentionNoSoftmaxFwdPipelineQRKSVSTrLoad
static constexpr index_t kAlignmentBias =
kPadSeqLenK ? 1 : Policy::template GetAlignmentBias<Problem>();
static constexpr index_t kGemmSingleRepM = Policy::template GetQKBlockGemmSingleRepM<Problem>();
static constexpr index_t kGemmNumRepM = kM0 / kGemmSingleRepM;
// used by NRepetitions2DEpilogue
static constexpr index_t kGemm1SingleRepN =
Policy::template GetKVBlockGemmSingleRepN<Problem>();
@@ -318,11 +315,6 @@ struct HstuAttentionNoSoftmaxFwdPipelineQRKSVSTrLoad
return make_null_tile_window(make_tuple(number<1>{}, number<1>{}));
}();
using q_tile_type = decltype(make_static_distributed_tensor<QKVDataType>(
Policy::template MakeQRegTileDistribution<Problem>()));
q_tile_type q_tile;
store_tile(q_lds_write_window, q_dram_tile);
clear_tile(o_acc);
@@ -331,7 +323,7 @@ struct HstuAttentionNoSoftmaxFwdPipelineQRKSVSTrLoad
block_sync_lds();
q_tile = load_tile(q_lds_read_window);
auto q_tile = load_tile(q_lds_read_window);
q_tile = tile_elementwise_in(q_element_func, q_tile);

View File

@@ -70,9 +70,6 @@ struct HstuAttentionWithSoftmaxFwdPipelineQRKSVSTrLoad
static constexpr index_t kAlignmentBias =
kPadSeqLenK ? 1 : Policy::template GetAlignmentBias<Problem>();
static constexpr index_t kGemmSingleRepM = Policy::template GetQKBlockGemmSingleRepM<Problem>();
static constexpr index_t kGemmNumRepM = kM0 / kGemmSingleRepM;
// used by NRepetitions2DEpilogue
static constexpr index_t kGemm1SingleRepN =
Policy::template GetKVBlockGemmSingleRepN<Problem>();
@@ -332,11 +329,6 @@ struct HstuAttentionWithSoftmaxFwdPipelineQRKSVSTrLoad
return make_null_tile_window(make_tuple(number<1>{}, number<1>{}));
}();
using q_tile_type = decltype(make_static_distributed_tensor<QKVDataType>(
Policy::template MakeQRegTileDistribution<Problem>()));
q_tile_type q_tile;
store_tile(q_lds_write_window, q_dram_tile);
clear_tile(o_acc);
@@ -345,7 +337,7 @@ struct HstuAttentionWithSoftmaxFwdPipelineQRKSVSTrLoad
block_sync_lds();
q_tile = load_tile(q_lds_read_window);
auto q_tile = load_tile(q_lds_read_window);
q_tile = tile_elementwise_in(q_element_func, q_tile);