[CK_TILE] add tensorwise quant in grouped gemm (#3007)

* add tensorwise quant in grouped gemm

* fix example issue

* update test cases

* format code

* clang format

* use GTEST_FAIL

* fix a bug in test_grouped_gemm_util

* skip test when using wmma on grouped_quant kernel

* change cmake

* change code based on comments

---------

Co-authored-by: ThomasNing <thomas.ning@amd.com>
This commit is contained in:
kyle-256
2025-10-24 22:41:54 +08:00
committed by GitHub
parent 6bbc05e1bd
commit 3c12a02827
11 changed files with 671 additions and 68 deletions

View File

@@ -393,6 +393,13 @@ struct QuantGroupedGemmKernel
aq_block_window,
bq_block_window);
}
else if constexpr(kQuantType == QuantType::TensorQuant)
{
const AccDataType aq_scale = type_convert<AccDataType>(*aq_ptr);
const AccDataType bq_scale = type_convert<AccDataType>(*bq_ptr);
EpiloguePipeline{}(
c_block_window, c_block_tile, c_block_window, smem_ptr_0, aq_scale, bq_scale);
}
}
// For persistent kernels