use old ctile to avoid conv2d fwd bias relu add compute error (#271)

This commit is contained in:
Shaojie WANG
2022-06-03 03:06:42 +08:00
committed by GitHub
parent 86185bd7ce
commit 1c5d06f270
3 changed files with 13 additions and 20 deletions

View File

@@ -340,7 +340,7 @@ struct GridwiseGemm_k0mk1_k0nk1_mn_xdlops_v3r3
using DefaultBlock2CTileMap =
remove_cvref_t<decltype(MakeDefaultBlock2CTileMap(CGridDesc_M_N{}, 1, 1))>;
-template <bool HasMainKBlockLoop, typename Block2CTileMap = DefaultBlock2CTileMap>
+template <bool HasMainKBlockLoop, typename Block2CTileMap>
__device__ static void
Run(const FloatAB* __restrict__ p_a_grid,
const FloatAB* __restrict__ p_b_grid,