Added LDS double buffer for implicit GEMM v4 (NCHW, KCYX)

[ROCm/composable_kernel commit: ad5db169b6]
This commit is contained in:
Chao Liu
2019-05-30 20:55:21 -05:00
parent be1b3be83d
commit 3e7d31c326
3 changed files with 428 additions and 4 deletions

View File

@@ -455,10 +455,10 @@ int main(int argc, char* argv[])
constexpr index_t HPad = 0;
constexpr index_t WPad = 0;
#elif 0
#elif 1
// 1x1 filter, 28x28 image
constexpr index_t N = 16;
constexpr index_t C = 256;
constexpr index_t N = 128;
constexpr index_t C = 512;
constexpr index_t HI = 28;
constexpr index_t WI = 28;
constexpr index_t K = 512;