mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
Tests for CK Tile Batched Transpose and Smoothquant (#2453)
* Create tests for ck tile batched transpose using example * Create ck tile tests for smoothquant using examples * fix precision input strings and convert batched transpose to regression tests * Code cleanup and fix asserts * add missing licenses * update copyright and licensing in files * Update smoothquant tests to use example's smoothquant.cpp * Add custom target for batched transpose tests * Add missing new lines at end of files for CMakelists * fix typo in batched transpose CMakeList target_compile_options --------- Co-authored-by: root <root@ctr-ubbsmc16.amd.com>
This commit is contained in:
143
test/ck_tile/smoothquant/instances/smoothquant_fwd_api.cpp
Normal file
143
test/ck_tile/smoothquant/instances/smoothquant_fwd_api.cpp
Normal file
@@ -0,0 +1,143 @@
|
||||
// Copyright © Advanced Micro Devices, Inc., or its affiliates.
|
||||
// SPDX-License-Identifier: MIT
|
||||
|
||||
#include <ck_tile/core.hpp>
|
||||
#include "smoothquant.hpp"
|
||||
|
||||
template <typename DataType_,
|
||||
ck_tile::index_t Repeat_M_, // each thread repeat along M
|
||||
ck_tile::index_t Repeat_N_, // each thread repeat along N
|
||||
ck_tile::index_t ThreadPerBlock_M_, // num threads along M
|
||||
ck_tile::index_t ThreadPerBlock_N_, // num threads along N
|
||||
ck_tile::index_t Vector_N_, // vector size along N
|
||||
bool kPadN_,
|
||||
bool kTwoPass_>
|
||||
using trait_ = smoothquant_traits_<DataType_,
|
||||
Repeat_M_,
|
||||
Repeat_N_,
|
||||
ThreadPerBlock_M_,
|
||||
ThreadPerBlock_N_,
|
||||
Vector_N_,
|
||||
kPadN_,
|
||||
kTwoPass_>;
|
||||
|
||||
template <typename data_type>
|
||||
float smoothquant_dispatch(smoothquant_traits /*t*/,
|
||||
smoothquant_args a,
|
||||
const ck_tile::stream_config& s)
|
||||
{
|
||||
float r = -1;
|
||||
// clang-format off
|
||||
// rm rn tm tn vn pd 2p
|
||||
if(a.n <= 64) {
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 4, 64, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 128) {
|
||||
if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 4, 64, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 4, 64, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 256) {
|
||||
if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 4, 64, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 4, 64, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 4, 64, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 512) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 4, 64, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 4, 64, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 4, 64, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 8, 4, 64, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 768) {
|
||||
if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 4, 64, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 6, 4, 64, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1,12, 4, 64, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 1024) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 2, 128, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 2, 128, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 2, 128, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 256, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 1536) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 4, 64, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 2, 128, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 1, 256, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 6, 1, 256, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 2048) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 1, 1, 256, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 1, 256, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 256, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 8, 1, 256, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 3072) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 1, 128, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 1, 256, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 6, 1, 256, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 3, 1, 1024, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n <= 4096) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 1, 256, 8, true, false>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 256, 4, true, false>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 1, 1024, 2, true, false>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 1024, 1, true, false>>(s, a);
|
||||
}
|
||||
else if(a.n > 4096) {
|
||||
if (a.n % 8 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 1, 256, 8, true, true>>(s, a);
|
||||
else if (a.n % 4 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 256, 4, true, true>>(s, a);
|
||||
else if (a.n % 2 == 0)
|
||||
r = smoothquant_<trait_<data_type, 1, 2, 1, 1024, 2, true, true>>(s, a);
|
||||
else
|
||||
r = smoothquant_<trait_<data_type, 1, 4, 1, 1024, 1, true, true>>(s, a);
|
||||
}
|
||||
return r;
|
||||
// clang-format on
|
||||
}
|
||||
|
||||
float smoothquant(smoothquant_traits t, smoothquant_args a, const ck_tile::stream_config& s)
|
||||
{
|
||||
if(t.data_type.compare("fp16") == 0)
|
||||
{
|
||||
return smoothquant_dispatch<ck_tile::fp16_t>(t, a, s);
|
||||
}
|
||||
else if(t.data_type.compare("bf16") == 0)
|
||||
{
|
||||
return smoothquant_dispatch<ck_tile::bf16_t>(t, a, s);
|
||||
}
|
||||
else
|
||||
throw std::runtime_error("Without supported instances!");
|
||||
}
|
||||
Reference in New Issue
Block a user