diff --git a/example/ck_tile/18_hstu_attention/hstu_attention_pipeline_problem.hpp b/example/ck_tile/18_hstu_attention/hstu_attention_pipeline_problem.hpp index ac09975aa5..886bb29c1c 100644 --- a/example/ck_tile/18_hstu_attention/hstu_attention_pipeline_problem.hpp +++ b/example/ck_tile/18_hstu_attention/hstu_attention_pipeline_problem.hpp @@ -60,10 +60,11 @@ struct HstuAttentionFwdPipelineProblem { if constexpr(std::is_same_v || std::is_same_v) { + // ToDo: need support in ck_tile for using buffer_load_dwordx3 + // if constexpr(ElemPerThread % 6 == 0) + // return 6; if constexpr(ElemPerThread % 8 == 0) return 8; - else if constexpr(ElemPerThread % 6 == 0) - return 6; else if constexpr(ElemPerThread % 4 == 0) return 4; else if constexpr(ElemPerThread % 2 == 0) @@ -72,10 +73,11 @@ struct HstuAttentionFwdPipelineProblem } else if constexpr(std::is_same_v) { + // ToDo: need support in ck_tile for using buffer_load_dwordx3 + // if constexpr(ElemPerThread % 3 == 0) + // return 3; if constexpr(ElemPerThread % 4 == 0) return 4; - else if constexpr(ElemPerThread % 3 == 0) - return 3; else if constexpr(ElemPerThread % 2 == 0) return 2; return 1;