mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 10:09:41 +00:00
* fix compile error
* fix typo of padding
* Add smoothquant op
* Add smoothquant instance library
* refine type
* add test script
* Re-generate smoothquant.hpp
* Always use 'current year' in copyright
* use Generic2dBlockShape instead
* Add vector = 8 instance back
* Find exe path automatically
* Simplify the api condition
* Remove debugging code
* update year
* Add blank line between function declaration
* explicitly cast return value to dim3
* refine return value
* Fix default warmup and repeat value
* Add comment
* refactor smoothquant cmake
* Add README
* Fix typo
---------
Co-authored-by: Po Yen, Chen <PoYen.Chen@amd.com>
[ROCm/composable_kernel commit: fbd654545a]
31 lines
966 B
Bash
Executable File
31 lines
966 B
Bash
Executable File
#!/bin/sh
#
# Smoke-test driver for the tile_smoothquant example executable.
#
# Locates the first regular file named "tile_smoothquant" below the current
# directory and runs it once per (precision, problem size) combination listed
# below. Run this from a directory that contains the built executable
# somewhere beneath it (e.g. the build tree).
#
# Exit status: 0 if every invocation succeeded, 1 if the executable could not
# be found or at least one invocation returned a non-zero status.

# Pick the first match; the script does not try to disambiguate if several
# builds of the executable exist under the current directory.
EXE="$(find . -name tile_smoothquant -type f | head -n 1)"

# Without this guard an empty $EXE would make every line below try to execute
# "-prec=..." as a command, producing a wall of unrelated errors.
if [ -z "$EXE" ]; then
    echo "error: tile_smoothquant executable not found under $(pwd)" >&2
    exit 1
fi

# Aggregate result of all runs; flipped to 1 by run_case on any failure.
status=0

# Run the executable with the given arguments. A failing case is recorded in
# $status but does not stop the remaining cases from running.
run_case() {
    "$EXE" "$@" || status=1
}

for pr_i in "fp16" "bf16" ; do
    # Each case passes -m and -n, and some add -stride (always larger than -n
    # here). NOTE(review): presumably m/n are the row/column counts and stride
    # is the row pitch -- confirm against the example's argument parser.
    run_case -prec="$pr_i" -m=99 -n=13
    run_case -prec="$pr_i" -m=17 -n=16
    run_case -prec="$pr_i" -m=1 -n=100
    run_case -prec="$pr_i" -m=4 -n=128
    run_case -prec="$pr_i" -m=80 -n=127
    run_case -prec="$pr_i" -m=22 -n=255 -stride=256
    run_case -prec="$pr_i" -m=7 -n=599
    run_case -prec="$pr_i" -m=19 -n=512
    run_case -prec="$pr_i" -m=33 -n=313 -stride=1000
    run_case -prec="$pr_i" -m=11 -n=510
    run_case -prec="$pr_i" -m=171 -n=676 -stride=818
    run_case -prec="$pr_i" -m=91 -n=636
    run_case -prec="$pr_i" -m=12 -n=768 -stride=800
    run_case -prec="$pr_i" -m=100 -n=766 -stride=812
    run_case -prec="$pr_i" -m=31 -n=1024
    run_case -prec="$pr_i" -m=64 -n=1000 -stride=1004
    run_case -prec="$pr_i" -m=8 -n=1501
    run_case -prec="$pr_i" -m=3 -n=1826
    run_case -prec="$pr_i" -m=5 -n=2040
    run_case -prec="$pr_i" -m=7 -n=2734
    run_case -prec="$pr_i" -m=1 -n=3182
    run_case -prec="$pr_i" -m=9 -n=4096
    run_case -prec="$pr_i" -m=3 -n=8192
    run_case -prec="$pr_i" -m=1 -n=10547
    run_case -prec="$pr_i" -m=3 -n=17134
done

exit "$status"