This commit is contained in:
yadaish
2025-12-04 18:47:53 +00:00
parent e37dbc7e49
commit 12d764e999

View File

@@ -206,7 +206,7 @@ struct F16xMXF4FlatmmPipelineAGmemBGmemCRegV1
 constexpr int PackedCnt = ScalarCnt / MXFP4PackedSize;
 constexpr int float_mantissa = 23;
-uint32_t uscale = uint32_t(scale) << float_mantissa;
+uint32_t uscale = uint32_t(bit_cast<uint8_t>(scale)) << float_mantissa;
 using ComputeV2Type =
 std::conditional_t<std::is_same_v<ComputeType, half_t>, fp16x2_t, bf16x2_t>;