diff --git a/include/ck_tile/ops/transpose/transpose_policy.hpp b/include/ck_tile/ops/transpose/transpose_policy.hpp index ff65231924..5d65262ca1 100644 --- a/include/ck_tile/ops/transpose/transpose_policy.hpp +++ b/include/ck_tile/ops/transpose/transpose_policy.hpp @@ -105,17 +105,12 @@ struct TransposePolicy template CK_TILE_HOST_DEVICE static constexpr auto MakeOutputDistribution() { - // constexpr index_t BlockSize = Problem::kBlockSize; - // the dimension is reversed after transpose - // constexpr index_t LeadDimPerBlock = Problem::kSecondSizePerBlock; - // constexpr index_t SecondDimPerBlock = Problem::kLeadSizePerBlock; constexpr index_t kSecondIterPerWarp = Problem::kLeadXdlNumPerWarp; constexpr index_t kLeadIterPerWarp = Problem::kSecondXdlNumPerWarp; constexpr index_t kSecondNumWarps = Problem::kLeadNumWarps; constexpr index_t kLeadNumWarps = Problem::kSecondNumWarps; // transpose is based on 64 Bytes - constexpr index_t kLead = - Problem::kSecondSizePerXdl; // Problem::kLeadSizePerXdl; + constexpr index_t kLead = Problem::kSecondSizePerXdl; // Problem::kLeadSizePerXdl; constexpr index_t kSecond = Problem::kLeadSizePerXdl; constexpr index_t kLeadDimstr = kLead / QuartTransposeTraits::kleadDimT; @@ -128,7 +123,7 @@ struct TransposePolicy tile_distribution_encoding, tuple, sequence>, - tuple>, + tuple>, tuple>, sequence<2, 1>, sequence<0, 0>>{}; @@ -137,14 +132,6 @@ struct TransposePolicy constexpr auto block_dstr = make_static_tile_distribution(blk_distr_encode); return block_dstr; - // TODO, fix the tile distribution - // return make_static_tile_distribution( - // tile_distribution_encoding, - // tuple, sequence<4, VecLoadSize>>, - // tuple>, - // tuple>, - // sequence<2>, - // sequence<1>>{}); } template