diff --git a/example/ck_tile/01_fmha/script/smoke_test_bwd_v3.sh b/example/ck_tile/01_fmha/script/smoke_test_bwd_v3.sh
index 95054ae7ee..1b853f6d1f 100644
--- a/example/ck_tile/01_fmha/script/smoke_test_bwd_v3.sh
+++ b/example/ck_tile/01_fmha/script/smoke_test_bwd_v3.sh
@@ -10,16 +10,18 @@ COMMON_ARGS='-v=1'
 set -x
 for prec in "fp16" "bf16" ; do
 for perm in 0 1 ; do
-for hdim in 128 ; do
+for hdim in 64 72 96 128 ; do
 for v3_atomic_fp32 in 0 1 ; do
+for v3_bf16_cvt in 0 1 2 ; do
 for mask in 0 1 ; do
 
-$EXE -prec=$prec -b=4 -h=2 -d=$hdim -s=512 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -mode=0 -kname=$KNAME $COMMON_ARGS
-$EXE -prec=$prec -b=1 -h=3 -d=$hdim -s=768 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -mode=0 -kname=$KNAME $COMMON_ARGS
+$EXE -prec=$prec -b=2 -h=4 -h_k=2 -d=$hdim -s=512 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -v3_bf16_cvt=$v3_bf16_cvt -mode=0 -kname=$KNAME $COMMON_ARGS
+$EXE -prec=$prec -b=1 -h=3 -h_k=1 -d=$hdim -s=768 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -v3_bf16_cvt=$v3_bf16_cvt -mode=0 -kname=$KNAME $COMMON_ARGS
 
 done
 done
 done
 done
 done
+done
 set +x
diff --git a/example/ck_tile/01_fmha/script/smoke_test_bwd_v3_xqa.sh b/example/ck_tile/01_fmha/script/smoke_test_bwd_v3_xqa.sh
deleted file mode 100644
index 846d218cc4..0000000000
--- a/example/ck_tile/01_fmha/script/smoke_test_bwd_v3_xqa.sh
+++ /dev/null
@@ -1,27 +0,0 @@
-#!/bin/sh
-# TODO: run this script from CK root or build directory
-EXE="$(find . -name tile_example_fmha_bwd -type f | head -n 1)"
-KNAME=1
-
-export CK_WARMUP=0
-export CK_REPEAT=1
-
-COMMON_ARGS='-v=1'
-set -x
-for prec in "fp16" "bf16" ; do
-for perm in 0 1 ; do
-for hdim in 72 96 128 ; do
-for v3_atomic_fp32 in 0 1 ; do
-for v3_bf16_cvt in 0 1 2 ; do
-for mask in 0 1 ; do
-
-$EXE -prec=$prec -b=2 -h=4 -h_k=2 -d=$hdim -s=512 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -v3_bf16_cvt=$v3_bf16_cvt -mode=0 -kname=$KNAME $COMMON_ARGS
-$EXE -prec=$prec -b=1 -h=3 -h_k=1 -d=$hdim -s=768 -iperm=$perm -operm=$perm -mask=$mask -bwd_v3=1 -v3_atomic_fp32=$v3_atomic_fp32 -v3_bf16_cvt=$v3_bf16_cvt -mode=0 -kname=$KNAME $COMMON_ARGS
-
-done
-done
-done
-done
-done
-done
-set +x