mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 14:29:05 +00:00
* Finished adding the performance benchmark for ck tile gemm * Fix the executable rename problem * fix the executable name error * delete the unsupported layout combinations * Update run_full_test.sh * Update benchmark_mem_pipeline.sh * Update benchmark_basic.sh * change the executable of gemm_universal * change ck_tile_gemm script permissions * Addressed the comment * Addressed the comment * Fixed the comments * Fixed Comment * roll back the malfunctioned change * Fix the Typo * finalize the tile_gemm_fp16 performance monitoring * fix the stash names for ck_tile gemm logs * change the stashing logic * change stashing syntax --------- Co-authored-by: Illia Silin <98187287+illsilin@users.noreply.github.com> Co-authored-by: illsilin <Illia.Silin@amd.com>
62 lines
1.9 KiB
Bash
Executable File
62 lines
1.9 KiB
Bash
Executable File
#!/bin/bash
#
# Feed the performance logs found in the current directory to
# process_perf_data.py, one invocation per log file.
#
# In order to run this script you need the following python packages:
#
#   pip3 install --upgrade pip
#   pip3 install sqlalchemy pymysql pandas sshtunnel
#
# You also need to set up some environment variables in order to post your
# new test results to the database and compare them to the baseline.
# Please contact Illia.Silin@amd.com for more details.

# Logs that are always handed to the processor, without checking that the
# file exists first.
readonly -a REQUIRED_PERF_LOGS=(
  perf_gemm.log
  perf_onnx_gemm.log
  perf_resnet50_N256.log
  perf_resnet50_N4.log
)

# Logs that are processed only when the file is present in the current
# directory. Order matters: the script's exit status comes from the last entry.
readonly -a OPTIONAL_PERF_LOGS=(
  perf_onnx_gemm_gfx10.log
  perf_onnx_gemm_gfx11.log
  perf_onnx_gemm_gfx12.log
  perf_fmha_fwd_gfx942.log
  perf_fmha_bwd_gfx942.log
  perf_fmha_fwd_gfx90a.log
  perf_fmha_bwd_gfx90a.log
  perf_tile_gemm_basic_fp16_gfx942.log
  perf_tile_gemm_basic_fp16_gfx90a.log
  perf_tile_gemm_mem_pipeline_fp16_gfx942.log
  perf_tile_gemm_mem_pipeline_fp16_gfx90a.log
)

#######################################
# Run process_perf_data.py on a single log file.
# Arguments: $1 - log file name, forwarded to the processor unchanged
# Returns:   exit status of the python3 invocation
#######################################
process_log() {
  python3 process_perf_data.py "$1"
}

#######################################
# Process every required log, then every optional log that exists.
# A failing invocation does not stop the remaining logs from being processed.
# Globals:   REQUIRED_PERF_LOGS (read), OPTIONAL_PERF_LOGS (read)
# Returns:   status of the last optional-log step: 0 when that log is
#            absent, otherwise the status of its processing run
#######################################
process_all_logs() {
  local log

  for log in "${REQUIRED_PERF_LOGS[@]}"; do
    process_log "$log"
  done

  for log in "${OPTIONAL_PERF_LOGS[@]}"; do
    # The same name is used for the existence check and for the processor
    # argument, so the two can never disagree.
    if [[ -e "./${log}" ]]; then
      process_log "$log"
    fi
  done
}

#process results
process_all_logs