Enable padding blockscale for abquant (#3453)

* Enable padding blockscale for abquant
* run clang-format
* Reduce unnecessary testing
* remove cout
2026-04-20 06:49:15 +00:00 · 2025-12-25 01:12:40 +08:00
parent 1c3151963b
commit 7f68f3c4fa
8 changed files with 128 additions and 138 deletions
--- a/include/ck_tile/ops/gemm_quant/kernel/gemm_quant_kernel.hpp
+++ b/include/ck_tile/ops/gemm_quant/kernel/gemm_quant_kernel.hpp
@@ -412,32 +412,6 @@ struct QuantGemmKernel
            return false;
        }

-        if constexpr(kQuantType == QuantType::AQuantGrouped ||
-                     kQuantType == QuantType::ABQuantGrouped)
-        {
-            if(kargs.QK_A % GemmPipeline::GetVectorSizeAQ() != 0)
-            {
-                if(ck_tile::EnvIsEnabled(CK_TILE_ENV(CK_TILE_LOGGING)))
-                {
-                    CK_TILE_ERROR("K_A is not a multiple of vector load size for A tensor!");
-                }
-                return false;
-            }
-        }
-
-        if constexpr(kQuantType == QuantType::BQuantGrouped ||
-                     kQuantType == QuantType::ABQuantGrouped)
-        {
-            if(kargs.QK_B % GemmPipeline::GetVectorSizeBQ() != 0)
-            {
-                if(ck_tile::EnvIsEnabled(CK_TILE_ENV(CK_TILE_LOGGING)))
-                {
-                    CK_TILE_ERROR("K_B is not a multiple of vector load size for B tensor!");
-                }
-                return false;
-            }
-        }
-
        if constexpr(std::is_same_v<ALayout, tensor_layout::gemm::RowMajor>)
        {
            if(kargs.K % (TilePartitioner::KPerBlock * kargs.k_batch) != 0 &&