[CK_TILE] Patch for pk_fp4 ref check and buffer load. (#3044)

* Patch for pk_fp4_raw_t buffer load (accept pk_fp4_raw_t with N = 1, 2, 4, 8 or 16 in the amd_buffer_load_impl static_assert) and ref check
This commit is contained in:
Gino Lu
2025-10-20 14:47:04 +08:00
committed by GitHub
parent af3786fe08
commit fb1d090f3c
2 changed files with 54 additions and 0 deletions

View File

@@ -1405,6 +1405,8 @@ CK_TILE_DEVICE thread_buffer<T, N> amd_buffer_load_impl(int32x4_t src_wave_buffe
(std::is_same<T, fp8_t>::value && (N == 1 || N == 2 || N == 4 || N == 8 || N == 16)) ||
(std::is_same<T, bf8_t>::value && (N == 1 || N == 2 || N == 4 || N == 8 || N == 16)) ||
(std::is_same<T, int8_t>::value && (N == 1 || N == 2 || N == 4 || N == 8 || N == 16)) ||
(std::is_same<T, pk_fp4_raw_t>::value &&
(N == 1 || N == 2 || N == 4 || N == 8 || N == 16)) ||
(std::is_same<T, pk_int4_t>::value &&
(N == 1 || N == 2 || N == 4 || N == 8 || N == 16 || N == 32)),
"wrong! not implemented");