mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-18 03:49:41 +00:00
Padding support for wave transfer (#3537)
* Add padding support with transpose
Also move the validity check to before writing, by storing is_src_valid during reading
* Add/modify instances to use wave transfer for gemm universal
The condition is changed so that the vector size of both VMEM reading and LDS
writing must now be equal to 8 in order to use the wave transfer
* Fix clang format
* Modify example
* Fix bwd data
* Add restriction for wave transfer with padding and transpose
Add a test case that demonstrates this limitation
* Fix validity checks for 8-bit types
* Add validity check for gemm_bias_add_reduce
* Add validity check for grouped gemm tile loop
* Fix validity checks for new flavours
* Minor fixes
* Fix clang format
[ROCm/composable_kernel commit: 2e49b6b2f7]
This commit is contained in:
@@ -125,7 +125,7 @@ TYPED_TEST(TestGemmUniversal_FP16_KM_NK, MidLargeM)
|
||||
|
||||
TYPED_TEST(TestGemmUniversal_FP16_MK_KN, PaddK)
|
||||
{
|
||||
std::vector<int> Ms{127};
|
||||
std::vector<int> Ms{127, 128};
|
||||
constexpr int N = 512;
|
||||
constexpr int K = 437;
|
||||
|
||||
@@ -139,7 +139,7 @@ TYPED_TEST(TestGemmUniversal_FP16_MK_KN, PaddK)
|
||||
|
||||
TYPED_TEST(TestGemmUniversal_FP16_MK_NK, PaddK)
|
||||
{
|
||||
std::vector<int> Ms{127};
|
||||
std::vector<int> Ms{127, 128};
|
||||
constexpr int N = 512;
|
||||
constexpr int K = 437;
|
||||
|
||||
@@ -153,7 +153,7 @@ TYPED_TEST(TestGemmUniversal_FP16_MK_NK, PaddK)
|
||||
|
||||
TYPED_TEST(TestGemmUniversal_FP16_KM_KN, PaddK)
|
||||
{
|
||||
std::vector<int> Ms{127};
|
||||
std::vector<int> Ms{127, 128};
|
||||
constexpr int N = 512;
|
||||
constexpr int K = 437;
|
||||
|
||||
@@ -169,7 +169,7 @@ TYPED_TEST(TestGemmUniversal_FP16_KM_KN, PaddK)
|
||||
|
||||
TYPED_TEST(TestGemmUniversal_FP16_KM_NK, PaddK)
|
||||
{
|
||||
std::vector<int> Ms{127};
|
||||
std::vector<int> Ms{127, 128};
|
||||
constexpr int N = 512;
|
||||
constexpr int K = 437;
|
||||
|
||||
|
||||
Reference in New Issue
Block a user