mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
[ck_tile] Pooling example - Improved tile sizes (#3233)
* improved tile sizes
  - modified tile sizes for improved example performance
* Update example/ck_tile/36_pooling/pool3d.cpp

Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com>

---------

Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com>
This commit is contained in:
committed by
GitHub
parent
ad57f6ef0b
commit
1eb26460aa
@@ -31,8 +31,8 @@ auto create_args(int argc, char* argv[])
|
||||
.insert("RightPy", "1", "right padding h")
|
||||
.insert("RightPx", "1", "right padding w")
|
||||
.insert("v", "1", "cpu validation or not")
|
||||
.insert("warmup", "0", "cold iter")
|
||||
.insert("repeat", "1", "hot iter");
|
||||
.insert("warmup", "20", "cold iter")
|
||||
.insert("repeat", "100", "hot iter");
|
||||
|
||||
bool result = arg_parser.parse(argc, argv);
|
||||
return std::make_tuple(result, arg_parser);
|
||||
@@ -120,10 +120,10 @@ bool run(const ck_tile::ArgParser& arg_parser)
|
||||
in_buf.ToDevice(in.data());
|
||||
|
||||
using ReduceOp = ck_tile::ReduceOp::Max;
|
||||
using BlockWarps = ck_tile::sequence<4, 1>;
|
||||
using BlockTile = ck_tile::sequence<128, 128>;
|
||||
using WarpTile = ck_tile::sequence<32, 128>;
|
||||
using ThreadTile = ck_tile::sequence<8, 8>;
|
||||
using BlockWarps = ck_tile::sequence<1, 1>;
|
||||
using BlockTile = ck_tile::sequence<128, 1>;
|
||||
using WarpTile = ck_tile::sequence<128, 1>;
|
||||
using ThreadTile = ck_tile::sequence<2, 1>;
|
||||
|
||||
using Shape = ck_tile::PoolShape<BlockWarps, BlockTile, WarpTile, ThreadTile>;
|
||||
using Problem = ck_tile::PoolProblem<InDataType,
|
||||
|
||||
Reference in New Issue
Block a user