mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 18:17:44 +00:00
* Finished adding the performance benchmark for ck tile gemm
* Fix the executable rename problem
* fix the executable name error
* delete the unsupported layout combinations
* Update run_full_test.sh
* Update benchmark_mem_pipeline.sh
* Update benchmark_basic.sh
* change the executable of gemm_universal
* change ck_tile_gemm script permissions
* Addressed the comment
* Addressed the comment
* Fixed the comments
* Fixed Comment
* roll back the malfunctioned change
* Fix the Typo
* finalize the tile_gemm_fp16 performance monitoring
* fix the stash names for ck_tile gemm logs
* change the stashing logic
* change stashing syntax
---------
Co-authored-by: Illia Silin <98187287+illsilin@users.noreply.github.com>
Co-authored-by: illsilin <Illia.Silin@amd.com>
[ROCm/composable_kernel commit: 73a076eee1]
71 lines
2.3 KiB
Bash
Executable File
71 lines
2.3 KiB
Bash
Executable File
#!/bin/bash
#
# To run this script you need the following Python packages:

#pip3 install --upgrade pip
#pip3 install sqlalchemy pymysql pandas sshtunnel

# You also need to set up some environment variables in order to
# post your new test results to the database and compare them to the baseline.
# Please contact Illia.Silin@amd.com for more details.

# Process results: every log listed here is passed to process_perf_data.py
# unconditionally, one invocation per log, in the order given.
required_logs=(
  perf_gemm.log
  perf_resnet50_N256.log
  perf_resnet50_N4.log
  perf_batched_gemm.log
  perf_grouped_gemm.log
  perf_grouped_conv_fwd.log
  perf_grouped_conv_bwd_data.log
  perf_grouped_conv_bwd_weight.log
  perf_gemm_bilinear.log
  perf_reduction.log
  perf_splitK_gemm.log
  perf_onnx_gemm.log
  perf_mixed_gemm.log
)

for perf_log in "${required_logs[@]}"; do
  python3 process_perf_data.py "$perf_log"
done

# Logs whose names carry a GPU target suffix (gfx10, gfx11, gfx12, gfx942,
# gfx90a). Each one is passed to process_perf_data.py only when it exists in
# the current directory; a missing log is skipped without any message.
optional_logs=(
  perf_onnx_gemm_gfx10.log
  perf_onnx_gemm_gfx11.log
  perf_onnx_gemm_gfx12.log
  perf_fmha_fwd_gfx942.log
  perf_fmha_bwd_gfx942.log
  perf_fmha_fwd_gfx90a.log
  perf_fmha_bwd_gfx90a.log
  perf_gemm_basic_gfx942.log
  perf_gemm_basic_gfx90a.log
  perf_gemm_mem_pipeline_gfx942.log
  perf_gemm_mem_pipeline_gfx90a.log
)

for perf_log in "${optional_logs[@]}"; do
  # Guard clause instead of an if-block; `continue` returns 0, so a missing
  # log leaves the same exit status as the untaken `if` did.
  [[ -e "./${perf_log}" ]] || continue
  python3 process_perf_data.py "$perf_log"
done