mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-17 19:40:04 +00:00
Merge commit 'f3e4d46faa5f3ce4d81c86121782d8a9aea27c5e' into develop
This commit is contained in:
@@ -11,19 +11,33 @@ namespace instance {
|
||||
|
||||
// Compilation parameters for in[n, hi, wi, g, c] * wei[g, k, y, x, c] = out[n, ho, wo, g, k]
|
||||
void add_device_grouped_conv3d_bwd_weight_wmma_bilinear_ndhwgc_gkzyxc_ndhwgk_f16_instances(
|
||||
std::vector<std::unique_ptr<DeviceGroupedConvBwdWeightMultipleD<3,
|
||||
NDHWGC,
|
||||
GKZYXC,
|
||||
NDHWGK,
|
||||
Tuple<GKZYXC>,
|
||||
F16,
|
||||
F16,
|
||||
F16,
|
||||
Tuple<F16>,
|
||||
PassThrough,
|
||||
Bilinear,
|
||||
PassThrough>>>& instances)
|
||||
[[maybe_unused]] std::vector<std::unique_ptr<DeviceGroupedConvBwdWeightMultipleD<3,
|
||||
NDHWGC,
|
||||
GKZYXC,
|
||||
NDHWGK,
|
||||
Tuple<GKZYXC>,
|
||||
F16,
|
||||
F16,
|
||||
F16,
|
||||
Tuple<F16>,
|
||||
PassThrough,
|
||||
Bilinear,
|
||||
PassThrough>>>&
|
||||
instances)
|
||||
{
|
||||
// One of the kernels in this code block fails to compile, but only on Windows when building for
|
||||
// gfx1101. It succeeds on Linux for all gfx110X series GPUs, and on Windows for other gfx110X
|
||||
// series GPUs.
|
||||
// TODO: Remove this ifdef combo disabling these kernels once we have followed up with the
|
||||
// compiler team and they are able to be built again. This is the compilation error that
|
||||
// results:
|
||||
//
|
||||
// error: Illegal instruction detected: Operand has incorrect register class.
|
||||
// V_CMP_NE_U32_e32 0, $src_private_base, implicit-def $vcc, implicit $exec
|
||||
// Compiler version info:
|
||||
// AMD clang version 22.0.0git (https://github.com/ROCm/llvm-project.git
|
||||
// 8e85e3138dd485c4221cc12aff9eb60ab48ed3b5+PATCHED:93c451b46cc0dc23c47d67e394b370de65731aac)
|
||||
#if !defined(_WIN32)
|
||||
// 1. Default
|
||||
add_device_operation_instances(
|
||||
instances,
|
||||
@@ -42,6 +56,7 @@ void add_device_grouped_conv3d_bwd_weight_wmma_bilinear_ndhwgc_gkzyxc_ndhwgk_f16
|
||||
GKZYXC,
|
||||
NDHWGK,
|
||||
ConvBwdWeightFilter1x1Stride1Pad0>{});
|
||||
#endif
|
||||
}
|
||||
|
||||
} // namespace instance
|
||||
|
||||
Reference in New Issue
Block a user