mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 10:09:41 +00:00
* tweak conv for odd C
* update script
* clean up elementwise op
* fix build
* clean up
* added example for gemm+bias+relu+add
* added example for gemm+bias+relu
* add profiler for gemm_s_shuffle; re-org files
* add profiler
* fix build
* clean up
* clean up
* clean up
* fix build
[ROCm/composable_kernel commit: 823657ed12]
21 lines
770 B
Bash
Executable File
21 lines
770 B
Bash
Executable File
#!/bin/bash
#
# Build one example target with make, then run the resulting binary on a
# single hard-coded GEMM problem size.
#
# Usage: <this-script> <example> <verify> <init> <repeat>
#   example  name passed to make and used to locate the binary: example/<example>
#   verify   forwarded unchanged to the driver as its 1st argument
#   init     forwarded unchanged to the driver as its 2nd argument
#   repeat   forwarded unchanged to the driver as its 3rd argument
#
# NOTE(review): the relative path example/<example> suggests this is meant to
# be run from the build directory -- confirm against the project layout.
#
# Exit status: 2 on wrong usage, make's status if the build fails, otherwise
# the status of the driver.

# Abort on the first failing command (in particular a failed build) and on
# use of an unset variable, instead of running a stale or missing binary.
set -euo pipefail

# All four arguments are required: a missing one would otherwise shift the
# problem-size values below into the verify/init/repeat positions.
if (( $# < 4 )); then
  printf 'Usage: %s <example> <verify> <init> <repeat>\n' "${0##*/}" >&2
  exit 2
fi

## GPU visibility
export HIP_VISIBLE_DEVICES=0

# $1 is the make target here, not a job count.
# NOTE(review): with GNU make, "-j" followed by a non-integer word is expected
# to mean "no job limit" with the word taken as a target -- confirm this is
# the intended behavior.
make -j "$1"

DRIVER="example/$1"
VERIFY="$2"
INIT="$3"
REPEAT="$4"

# Exactly one problem size is active at a time; uncomment another line (and
# comment out the active one) to switch sizes.
######## verify init repeat M___ N___ K___ StrideA StrideB StrideC StrideC1
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 256 256 256 256 256 256 256
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 960 1024 1024 1024 1024 1024 1024
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 1920 2048 2048 2048 2048 2048 2048
"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 3840 4096 4096 4096 4096 4096 4096
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 7680 8192 8192 8192 8192 8192 8192
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 1024 1024 1024 1024 1024 1024 1024
#"$DRIVER" "$VERIFY" "$INIT" "$REPEAT" 2048 2048 2048 2048 2048 2048 2048