Disable DL kernels on all architectures except gfx103x. (#3218)

* disable DL kernels on all archs except gfx103x

* add gfx10-3-generic target to CMake
This commit is contained in:
Illia Silin
2025-11-14 17:39:50 -08:00
committed by GitHub
parent 0aadb4b2c4
commit b38bb492a1
2 changed files with 3 additions and 3 deletions

View File

@@ -86,7 +86,7 @@ inline __device__ f8x8_t amd_assembly_i4_to_fp8x8(int a)
return bit_cast<f8x8_t>(((static_cast<uint64_t>(fp8x4_1) << 32) | fp8x4_0));
}
#ifdef DL_KERNELS
// c0 += inner_product(a, b0)
// c1 += inner_product(a, b1)
__device__ void amd_assembly_outer_product_1x2(float a, float b0, float b1, float& c0, float& c1)
@@ -430,6 +430,6 @@ __device__ void amd_assembly_outer_product_1x4(int8x16_t a,
c2,
c3);
}
#endif
} // namespace ck
#endif