mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-02 20:51:23 +00:00
Support Wave32 in CK_TILE - Part 1 (#2594)
* Support wave32/wave64 in CK_TILE - Part 1
* remove blocksize in kernel launch
* fix build error
* fix clang format
* fix clang format 2
* fix clang format 3
* fix fmha build error
* fix fmha build 2
* fix fmha build 3
* fix build error 4
* address review comment
* update change log
* replace KernelBlockSize with kBlockSize
* fix CI fail
* fix clang format
* address review comment and rebase code.
* fix universal test fail

---------

Co-authored-by: Lin, Qun <Quentin.Lin+amdeng@amd.com>
Co-authored-by: Thomas Ning <Thomas.Ning@amd.com>
This commit is contained in:
@@ -137,11 +137,11 @@ class TestCkTileBatchedTranspose // N C H W layout_in==
|
||||
Config::BlockTile::at(1)};
|
||||
auto kargs = Kernel::MakeKargs(host_args);
|
||||
|
||||
auto sc = ck_tile::stream_config{};
|
||||
const dim3 grid_size = Kernel::GridSize(host_args);
|
||||
constexpr dim3 block_size = Kernel::BlockSize();
|
||||
ck_tile::launch_kernel(
|
||||
sc, ck_tile::make_kernel<block_size.x, 1>(Kernel{}, grid_size, block_size, 0, kargs));
|
||||
auto sc = ck_tile::stream_config{};
|
||||
const dim3 grid_size = Kernel::GridSize(host_args);
|
||||
const dim3 block_size = Kernel::BlockSize();
|
||||
ck_tile::launch_kernel(sc,
|
||||
ck_tile::make_kernel<1>(Kernel{}, grid_size, block_size, 0, kargs));
|
||||
|
||||
y_dev.FromDevice(y_host.data());
|
||||
ck_tile::reference_batched_transpose<DataType>(x_host, y_ref, layout_in, layout_out);
|
||||
|
||||
Reference in New Issue
Block a user