mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-03 05:01:25 +00:00
* Finished the feature of gpu verification * Add the ck_tile_gemm test in the CI CD * add the include of tensor_layou in reference_gemm * Comment Addressed * split ck_tile fhma and gemm tests into separate stages * restructure the reference gemm * restructure a new reference_gemm api that could read the device mem --------- Co-authored-by: carlushuang <carlus.huang@amd.com> Co-authored-by: illsilin <Illia.Silin@amd.com>
35 lines
949 B
Bash
Executable File
35 lines
949 B
Bash
Executable File
#!/bin/bash
|
|
EXE="$(find . -name tile_example_gemm_basic -type f | head -n 1)"
|
|
KNAME=1
|
|
|
|
export CK_WARMUP=0
|
|
export CK_REPEAT=1
|
|
|
|
COMMON_ARGS='-v=2 -warmup=0 -repeat=1'
|
|
|
|
run_fp16_tests() {
|
|
for batch in 1 2; do
|
|
for m in 128 1024; do
|
|
for n in 128 2048; do
|
|
for k in 32 64; do
|
|
|
|
$EXE -b=$batch -m=$m -n=$n -k=$k -stride_a=0 -stride_b=0 -stride_c=0 -e=1e-5 -prec=fp16 $COMMON_ARGS
|
|
if [ $? -eq 0 ]; then
|
|
echo "Success: Test with batch=$batch, m=$m, n=$n, k=$k executed successfully."
|
|
else
|
|
echo "Error: Test with batch=$batch, m=$m, n=$n, k=$k failed to execute properly."
|
|
# Optionally, exit or break if you need to halt further execution
|
|
# exit 1
|
|
fi
|
|
|
|
done
|
|
done
|
|
done
|
|
done
|
|
}
|
|
|
|
set -x
|
|
|
|
run_fp16_tests
|
|
|
|
set +x |