more utility code

[ROCm/composable_kernel commit: 7a7fe16086]
This commit is contained in:
Chao Liu
2019-09-09 00:29:33 -05:00
parent b0f3708397
commit 399be319a2
21 changed files with 824 additions and 455 deletions

View File

@@ -115,8 +115,12 @@ void device_convolution_implicit_gemm_v1_chwn_cyxk_khwn_padded(InDesc,
constexpr index_t OutThreadCopyDataPerAccess_N = 4;
#endif
// GridSize is chosen at preprocessing time. Because the condition is the
// literal `#if 0`, the first definition (the product of the per-dimension
// quotients N/NPerBlock, K/KPerBlock, Ho/HoPerBlock, Wo/WoPerBlock) is
// compiled out, and the `#else` branch is the one in effect: GridSize == 1.
// NOTE(review): the "debug" tag sits on the disabled branch; presumably the
// hard-coded GridSize = 1 is the temporary debugging override and the computed
// value is the intended production setting -- confirm before relying on
// results produced with this configuration.
#if 0 // debug
constexpr index_t GridSize =
(N / NPerBlock) * (K / KPerBlock) * (Ho / HoPerBlock) * (Wo / WoPerBlock);
#else
constexpr index_t GridSize = 1;
#endif
printf("%s: BlockSize %u, GridSize %u \n", __func__, BlockSize, GridSize);