From 221862c912677a94bde5fb375d4cfb54262bd106 Mon Sep 17 00:00:00 2001 From: Rostyslav Geyyer Date: Wed, 19 Mar 2025 20:23:05 +0000 Subject: [PATCH] Add more debug info: print arg_a/arg_b in f8f6f4 MFMA intrinsics --- include/ck/utility/amd_xdlops.hpp | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/include/ck/utility/amd_xdlops.hpp b/include/ck/utility/amd_xdlops.hpp index 1fbedde266..ab23c1a128 100644 --- a/include/ck/utility/amd_xdlops.hpp +++ b/include/ck/utility/amd_xdlops.hpp @@ -520,6 +520,9 @@ struct intrin_mfma_f32_32x32x64f8f6f4<32, 32> using arg_type = int32x8_t; + printf("!!!!!!! %d %d %d %d ", arg_a[0], arg_a[1], arg_a[2], arg_a[3]); + printf("??????? %d %d %d %d ", arg_b[0], arg_b[1], arg_b[2], arg_b[3]); + reg_c.template AsType()(Number<0>{}) = __builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4( arg_type{arg_a[0], arg_a[1], arg_a[2], arg_a[3], 0, 0, 0, 0}, @@ -588,6 +591,9 @@ struct intrin_mfma_scale_f32_32x32x64f8f6f4<32, 32> using arg_type = int32x8_t; + printf("!!!!!!! %d %d %d %d ", arg_a[0], arg_a[1], arg_a[2], arg_a[3]); + printf("??????? %d %d %d %d ", arg_b[0], arg_b[1], arg_b[2], arg_b[3]); + reg_c.template AsType()(Number<0>{}) = __builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4( arg_type{arg_a[0], arg_a[1], arg_a[2], arg_a[3], 0, 0, 0, 0}, @@ -657,6 +663,9 @@ struct intrin_mfma_scale_f32_16x16x128f8f6f4<16, 16> using arg_type = int32x8_t; + printf("!!!!!!! %d %d %d %d ", arg_a[0], arg_a[1], arg_a[2], arg_a[3]); + printf("??????? %d %d %d %d ", arg_b[0], arg_b[1], arg_b[2], arg_b[3]); + reg_c.template AsType()(Number<0>{}) = __builtin_amdgcn_mfma_scale_f32_16x16x128_f8f6f4( arg_type{arg_a[0], arg_a[1], arg_a[2], arg_a[3], 0, 0, 0, 0}, @@ -722,8 +731,6 @@ struct intrin_mfma_f32_16x16x128f8f6f4<16, 16> using arg_type = int32x8_t; - static_assert(0 == 0); - printf("!!!!!!! %d %d %d %d ", arg_a[0], arg_a[1], arg_a[2], arg_a[3]); printf("??????? %d %d %d %d ", arg_b[0], arg_b[1], arg_b[2], arg_b[3]);