mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-04 21:51:28 +00:00
* update the performance test logic * fix unstash perf logs logic * untangle unstashing fmha logs for different archs * run process stage after running fmha tests * fix the processing of perf logs * fix arguments for run_performance scripts
84 lines
2.4 KiB
Bash
Executable File
84 lines
2.4 KiB
Bash
Executable File
#!/bin/bash
|
|
#
|
|
# in order to run this script you'd need the following python packages:
|
|
|
|
#pip3 install --upgrade pip
|
|
#pip3 install sqlalchemy pymysql pandas sshtunnel
|
|
|
|
# you would also need to set up some environment variables in order to
|
|
# post your new test results to the database and compare them to the baseline
|
|
# please contact Illia.Silin@amd.com for more details
|
|
|
|
#process results
|
|
file=./perf_gemm_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_gemm_gfx90a.log
|
|
fi
|
|
file=./perf_onnx_gemm_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_onnx_gemm_gfx90a.log
|
|
fi
|
|
file=./perf_resnet50_N256_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_resnet50_N256_gfx90a.log
|
|
fi
|
|
file=./perf_resnet50_N4_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_resnet50_N4_gfx90a.log
|
|
fi
|
|
|
|
file=./perf_gemm_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_gemm_gfx942.log
|
|
fi
|
|
file=./perf_onnx_gemm_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_onnx_gemm_gfx942.log
|
|
fi
|
|
file=./perf_resnet50_N256_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_resnet50_N256_gfx942.log
|
|
fi
|
|
file=./perf_resnet50_N4_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_resnet50_N4_gfx942.log
|
|
fi
|
|
|
|
file=./perf_onnx_gemm_gfx10.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_onnx_gemm_gfx10.log
|
|
fi
|
|
file=./perf_onnx_gemm_gfx11.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_onnx_gemm_gfx11.log
|
|
fi
|
|
file=./perf_onnx_gemm_gfx12.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_onnx_gemm_gfx12.log
|
|
fi
|
|
file=./perf_fmha_fwd_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_fmha_fwd_gfx942.log
|
|
fi
|
|
file=./perf_fmha_bwd_gfx942.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_fmha_bwd_gfx942.log
|
|
fi
|
|
file=./perf_fmha_fwd_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_fmha_fwd_gfx90a.log
|
|
fi
|
|
file=./perf_fmha_bwd_gfx90a.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_fmha_bwd_gfx90a.log
|
|
fi
|
|
|
|
for gpu in "gfx90a" "gfx942"; do
|
|
for dtype in "fp16" "bf16" "fp8" "bf8"; do
|
|
file=./perf_tile_gemm_mem_pipeline_${dtype}_${gpu}.log
|
|
if [ -e "$file" ]; then
|
|
python3 process_perf_data.py perf_tile_gemm_mem_pipeline_${dtype}_${gpu}.log
|
|
fi
|
|
done
|
|
done
|