mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-20 06:49:15 +00:00
[CK_TILE] Fix elementwise example in gfx11/12 (#2676)
* fix elementwise examples * improve robustness * fix ck_tile's elementwise test * update elementwise test
This commit is contained in:
@@ -14,13 +14,14 @@ struct ElementWiseShape
|
||||
|
||||
static constexpr index_t kWarpM = WarpTile::at(number<0>{});
|
||||
|
||||
static constexpr index_t kVectorM = 16 / sizeof(ComputeDataType);
|
||||
static constexpr index_t kVectorM =
|
||||
min(static_cast<index_t>(16 / sizeof(ComputeDataType)), kWarpM / get_warp_size());
|
||||
|
||||
static constexpr index_t kWarpPerBlockM = BlockWarps::at(number<0>{});
|
||||
|
||||
static constexpr index_t kThreadPerWarpM = kWarpM / kVectorM;
|
||||
static constexpr index_t kThreadPerWarpM = get_warp_size();
|
||||
|
||||
static constexpr index_t kRepeatM = kBlockM / (kWarpPerBlockM * kWarpM);
|
||||
static constexpr index_t kRepeatM = kBlockM / (kWarpPerBlockM * kVectorM * kThreadPerWarpM);
|
||||
|
||||
static constexpr index_t kBlockSize =
|
||||
ck_tile::get_warp_size() * reduce_on_sequence(BlockWarps{}, multiplies{}, number<1>{});
|
||||
|
||||
Reference in New Issue
Block a user