Implemented group level static quantization for s8s8s32of32|bf16 APIs

Details: - Group quantization is technique to improve accuracy where scale factors to quantize inputs and weights varies at group level instead of per channel and per tensor level. - Added new bench files to test GEMM with symmetric static quantization. - Added new get_size and reorder functions to account for storing sum of col-values separately per group. - Added new framework, kernels to support the same. - The scalefactors could be of type float or bf16. AMD-Internal:[SWLCSG-3274] Change-Id: I3e69ecd56faa2679a4f084031d35ffb76556230f
2026-05-05 15:01:13 +00:00 · 2025-02-19 05:59:07 +00:00
parent 99770558bb
commit 7243a5d521
25 changed files with 41770 additions and 52 deletions
--- a/addon/aocl_gemm/frame/lpgemm_5loop_interface_apis.h
+++ b/addon/aocl_gemm/frame/lpgemm_5loop_interface_apis.h
@@ -126,6 +126,35 @@ void lpgemm_rowvar_ ## LP_SFX \

 LPGEMM_5LOOP1(bfloat16,int8_t,float,bf16s4f32of32);

+#define LPGEMM_5LOOP2(A_type,B_type,C_type,LP_SFX) \
+void lpgemm_rowvar_ ## LP_SFX \
+     ( \
+       const dim_t           m, \
+       const dim_t           n, \
+       const dim_t           k, \
+       const A_type*         a, \
+       const dim_t           rs_a, \
+       const dim_t           cs_a, \
+       const AOCL_MEMORY_TAG mtag_a, \
+       const B_type*         b, \
+       const dim_t           rs_b, \
+       const dim_t           cs_b, \
+       const AOCL_MEMORY_TAG mtag_b, \
+       float*               c, \
+       const dim_t           rs_c, \
+       const dim_t           cs_c, \
+       const C_type          alpha, \
+       const C_type          beta, \
+       rntm_t*               rntm, \
+       lpgemm_thrinfo_t*     thread, \
+       lpgemm_cntx_t*        lcntx, \
+       lpgemm_group_post_op* grp_post_op_list, \
+       lpgemm_post_op*       post_op_list, \
+       AOCL_STORAGE_TYPE     c_downscale \
+     ) \
+
+LPGEMM_5LOOP2(int8_t,int8_t,int32_t,s8s8s32o32_sym_quant);
+
 #define LPGEMM_5LOOP_AVX2(A_type,B_type,C_type,LP_SFX) \
 void lpgemm_rowvar_avx2_ ## LP_SFX \
     ( \