mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-06-08 23:38:11 +00:00
Fix packing
This commit is contained in:
@@ -497,11 +497,11 @@ __global__ void test_mx_f32x32_device_scaled_convert(float* p_test, uint64_t* p_
     f4x32_t f4x32{};
     float32_t float32{};
     ck::static_for<0, N / 2, 1>{}([&](auto ii) {
-        f4x32.AsType<f4x2_pk_t>()(ck::Number<ii>{})
-            .pack(type_convert<f4_t>(vec32_generator(2 * ii, type_convert<float>(scale2)) /
-                                     type_convert<float>(scale2)),
-                  type_convert<f4_t>(vec32_generator(2 * ii + 1, type_convert<float>(scale2)) /
-                                     type_convert<float>(scale2)));
+        f4x32.AsType<f4x2_pk_t>()(ck::Number<ii>{}) = f4x2_pk_t{}.pack(
+            type_convert<f4_t>(vec32_generator(2 * ii, type_convert<float>(scale2)) /
+                               type_convert<float>(scale2)),
+            type_convert<f4_t>(vec32_generator(2 * ii + 1, type_convert<float>(scale2)) /
+                               type_convert<float>(scale2)));
     });
 
     float32 = scaled_type_convert<float32_t>(scale2, f4x32);
@@ -532,8 +532,7 @@ TEST(MXFP4, DeviceF4x32ToF32x32ScaledConvert)
     auto scale2 = e8m0_bexp_t(2.0f);
 
     ck::static_for<0, N, 1>{}([&](auto ii) {
-        EXPECT_EQ(out[i++],
-                  vec32_generator(ii, type_convert<float>(scale2)) / type_convert<float>(scale2))
+        EXPECT_EQ(out[i++], vec32_generator(ii, type_convert<float>(scale2)))
             << "ii: " << ii << std::endl;
     });
 
Reference in New Issue
Block a user