This commit is contained in:
coderfeli
2025-08-06 02:06:13 +00:00
parent 080bfd881a
commit cd45fe941d
5 changed files with 69 additions and 138 deletions

View File

@@ -33,17 +33,6 @@ float flatmm_calc(const ck_tile::FlatmmHostArgs<>& args, const ck_tile::stream_c
ck_tile::sequence<FlatmmConfig::M_Warp_Tile,
FlatmmConfig::N_Warp_Tile,
FlatmmConfig::K_Warp_Tile>>;
// static constexpr index_t kM = BlockTile::at(number<0>{});
// static constexpr index_t kN = BlockTile::at(number<1>{});
// static constexpr index_t kK = BlockTile::at(number<2>{});
// static constexpr bool PermuteA = PermuteA_;
// static constexpr bool PermuteB = PermuteB_;
// static constexpr index_t flatNPerWarp = BlockWarps::at(number<1>{}); // 4
// static constexpr index_t flatKPerWarp = WarpTile::at(number<2>{}) * WarpTile::at(number<1>{});// 16 * 64
// static constexpr index_t flatKPerBlock = flatKPerWarp * kK / WarpTile::at(number<2>{}); // 16 * 128
using TilePartitioner =
ck_tile::GemmSpatiallyLocalTilePartitioner<CodegenFlatmmShape,
FlatmmConfig::TileParitionerGroupNum,