diff --git a/src/include/common.hip.hpp b/src/include/common.hip.hpp index fc0d7d8bc3..6b8c450021 100644 --- a/src/include/common.hip.hpp +++ b/src/include/common.hip.hpp @@ -62,10 +62,9 @@ __host__ __device__ constexpr T min(T x, Ts... xs) return x < y ? x : y; } -}// namespace mod_conv +} // namespace mod_conv #if DEVICE_BACKEND_HIP // cast a pointer of LDS to its address extern "C" __attribute__((address_space(3))) void* __to_local(void* p)[[hc]]; #endif - diff --git a/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hip.hpp b/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hip.hpp index a95363fa60..e04b1752ea 100644 --- a/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hip.hpp +++ b/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn.hip.hpp @@ -287,10 +287,10 @@ struct GridwiseConvolutionImplicitGemm_v2_chwn_cyxk_khwn #elif 0 blockwise_gemm.Run_asm #endif - (p_wei_block + wei_cyxk_block_desc.Get1dIndex(0, y, x, 0), - p_in_block + y * Wi + x, - p_out_thread, - f_accum); + (p_wei_block + wei_cyxk_block_desc.Get1dIndex(0, y, x, 0), + p_in_block + y * Wi + x, + p_out_thread, + f_accum); } } } diff --git a/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hip.hpp b/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hip.hpp index a731964bc6..b68b73a6ad 100644 --- a/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hip.hpp +++ b/src/include/gridwise_convolution_implicit_gemm_v2_chwn_cyxk_khwn_lds_double_buffer.hip.hpp @@ -36,11 +36,14 @@ template struct GridwiseConvolutionImplicitGemm_v2_chwn_cyxk_khwn_lds_double_buffer { - __host__ __device__ constexpr GridwiseConvolutionImplicitGemm_v2_chwn_cyxk_khwn_lds_double_buffer() {} + __host__ + __device__ constexpr GridwiseConvolutionImplicitGemm_v2_chwn_cyxk_khwn_lds_double_buffer() + { + } __device__ void Run(const Float* const __restrict__ p_in_global, - const Float* const __restrict__ p_wei_global, - Float* const __restrict__ p_out_global) const + const Float* const __restrict__ p_wei_global, + Float* const __restrict__ p_out_global) const { constexpr auto I0 = Number<0>{}; constexpr auto I1 = Number<1>{};