mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-15 18:42:06 +00:00
* Finished the feature of gpu verification
* Add the ck_tile_gemm test to the CI/CD
* add the include of tensor_layout in reference_gemm
* Comment Addressed
* split ck_tile fmha and gemm tests into separate stages
* restructure the reference gemm
* restructure a new reference_gemm api that could read the device mem
---------
Co-authored-by: carlushuang <carlus.huang@amd.com>
Co-authored-by: illsilin <Illia.Silin@amd.com>
[ROCm/composable_kernel commit: 844f5a1712]
35 lines
949 B
Bash
Executable File
35 lines
949 B
Bash
Executable File
#!/bin/bash
# Smoke-test configuration: locate the example binary and set the run
# parameters shared by every invocation.

# First regular file named tile_example_gemm_basic under the current
# directory; left empty when nothing matches.
EXE="$(find . -type f -name tile_example_gemm_basic | head -n 1)"

# Not referenced elsewhere in this script.
KNAME=1

# Exported so child processes see them.
export CK_WARMUP=0 CK_REPEAT=1

# Flags appended to every test invocation.
COMMON_ARGS='-v=2 -warmup=0 -repeat=1'
#######################################
# Run the command in $EXE with -prec=fp16 over a grid of problem sizes.
#
# Invokes $EXE once for every combination of batch (1, 2), m (128, 1024),
# n (128, 2048) and k (32, 64) and prints one Success/Error line per run.
# A failing combination does not stop the sweep; every combination is
# attempted and the overall result is reported through the return status.
#
# Globals:
#   EXE          (read) command to execute; must be non-empty
#   COMMON_ARGS  (read) whitespace-separated flags appended to every run
# Outputs:
#   One "Success: ..." or "Error: ..." line per combination on stdout;
#   a diagnostic on stderr when EXE is empty.
# Returns:
#   0 if every run succeeded, 1 if EXE is empty or any run failed.
#######################################
run_fp16_tests() {
    local batch m n k
    local failures=0

    # Without a command to run, every iteration would fail with a
    # "command not found" error; report the real problem once instead.
    if [[ -z "${EXE:-}" ]]; then
        echo "Error: EXE is empty; no executable to test." >&2
        return 1
    fi

    for batch in 1 2; do
        for m in 128 1024; do
            for n in 128 2048; do
                for k in 32 64; do
                    # COMMON_ARGS is a flat flag list, so it is expanded
                    # unquoted on purpose to split it into separate words.
                    # shellcheck disable=SC2086
                    if "$EXE" -b="$batch" -m="$m" -n="$n" -k="$k" \
                        -stride_a=0 -stride_b=0 -stride_c=0 \
                        -e=1e-5 -prec=fp16 $COMMON_ARGS; then
                        echo "Success: Test with batch=$batch, m=$m, n=$n, k=$k executed successfully."
                    else
                        echo "Error: Test with batch=$batch, m=$m, n=$n, k=$k failed to execute properly."
                        # Keep going so the log lists every failing
                        # combination; the failure is reported on return.
                        failures=$((failures + 1))
                    fi
                done
            done
        done
    done

    if ((failures > 0)); then
        return 1
    fi
    return 0
}
# Trace the sweep so each invocation appears in the log.
set -x
run_fp16_tests
status=$?
set +x

# Exit with the sweep's status rather than that of `set +x`, so the caller
# (for example a CI stage) sees whatever run_fp16_tests reported.
exit "$status"