diff --git a/include/ck/tensor_operation/gpu/device/impl/device_gemm_multiple_d_xdl_cshuffle.hpp b/include/ck/tensor_operation/gpu/device/impl/device_gemm_multiple_d_xdl_cshuffle.hpp index 3b4259cc65..2edb41680b 100644 --- a/include/ck/tensor_operation/gpu/device/impl/device_gemm_multiple_d_xdl_cshuffle.hpp +++ b/include/ck/tensor_operation/gpu/device/impl/device_gemm_multiple_d_xdl_cshuffle.hpp @@ -577,9 +577,7 @@ struct DeviceGemmMultipleD_Xdl_CShuffle : public DeviceGemmMultipleD"; + if (params.back().find("v2") != std::string::npos and K % k_per_block != 0) + str = ""; return Solution{str, block_size, grid_size}; } @@ -156,7 +158,9 @@ std::vector Problem::GetSolutions(const std::string& arch) const const std::size_t num_instances = GetInstances(arch).size(); for(std::size_t i = 0; i < num_instances; ++i) { - solutions.push_back(MakeSolution(i, arch)); + auto solution = MakeSolution(i, arch); + if (solution.template_str != "") + solutions.push_back(solution); } return solutions;