Merge commit 'b26cb596b0cbea9f40ae36b3f245b5aa7120c5c9' into develop

This commit is contained in:
assistant-librarian[bot]
2026-01-27 18:19:38 +00:00
parent 21657a1f32
commit 417ad9c7f1
2 changed files with 5 additions and 5 deletions

View File

@@ -1242,7 +1242,7 @@ inline __host__ __device__ float2_t type_convert<float2_t, pk_i4_t>(pk_i4_t x)
#ifdef CK_USE_PK4_LAYOUT_SHUFFLE
float2_t res = {x_h, x_l};
#elif
#else
float2_t res = {x_l, x_h};
#endif
return res;

View File

@@ -111,7 +111,7 @@ CK_TILE_HOST_DEVICE fp32x2_t pk_int4_t_to_fp32x2_t(const pk_int4_t& x)
#ifdef CK_TILE_USE_PK4_LAYOUT_SHUFFLE
fp32x2_t res = {x_h, x_l};
#elif
#else
fp32x2_t res = {x_l, x_h};
#endif
return res;
@@ -129,7 +129,7 @@ CK_TILE_HOST_DEVICE fp32x2_t pk_int4_t_to_fp32x2_t_signed_conversion(const pk_in
#ifdef CK_TILE_USE_PK4_LAYOUT_SHUFFLE
fp32x2_t res = {x_h, x_l};
#elif
#else
fp32x2_t res = {x_l, x_h};
#endif
return res;
@@ -140,7 +140,7 @@ CK_TILE_HOST_DEVICE fp16x2_t pk_int4_t_to_halfx2_t(const pk_int4_t& x)
uint8_t x_u8 = ck_tile::bit_cast<uint8_t>(x);
#ifdef CK_TILE_USE_PK4_LAYOUT_SHUFFLE
uint32_t i4s = ((x_u8 & 0x0f) << 16) | ((x_u8 & 0xf0) >> 4);
#elif
#else
uint32_t i4s = ((x_u8 & 0xf0) << 12) | (x_u8 & 0xf);
#endif
const int EX = 0x64006400;
@@ -160,7 +160,7 @@ CK_TILE_HOST_DEVICE bf16x2_t pk_int4_t_to_bfloat16x2_t(const pk_int4_t& x)
#ifdef CK_TILE_USE_PK4_LAYOUT_SHUFFLE
bf16x2_t res = {type_convert<bf16_t>(x_h), type_convert<bf16_t>(x_l)};
#elif
#else
bf16x2_t res = {type_convert<bf16_t>(x_l), type_convert<bf16_t>(x_h)};
#endif
return res;