[CK_BUILDER] Improve CK Builder and CK Builder tests (#3382)

* Remove stale documentation. * Add placeholder for conv algorithm design description. Add link to conv factory description. * Improve testing transfer parameters. * Python script to check the block tilings. * Improve tests and conv types serialization. * Change representation of boolean values from 1/0 to true/false in instance strings. * Change representation of boolean values from 1/0 to true/false in conv algorithm types. * Test code improvements. * Improve conv descriptions tests. * Improve conv signature definition in conv fwd builder tests. * clang-format. * Remove obsolete script. * Revert StaticAssertTypeEq changes in conv layout tests. * Remove obsolete using declaration. --------- Co-authored-by: Ville Pietilä <>
2026-04-20 06:49:15 +00:00 · 2025-12-11 09:50:00 +02:00
parent 6d25525adc
commit d66e5f667c
33 changed files with 1568 additions and 1042 deletions
--- a/experimental/builder/test/utils/conv_algorithm_type_utils.hpp
+++ b/experimental/builder/test/utils/conv_algorithm_type_utils.hpp
@@ -0,0 +1,346 @@
+// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
+// SPDX-License-Identifier: MIT
+
+#pragma once
+
+#include "../impl/conv_algorithm_types.hpp"
+#include <sstream>
+#include <array>
+
+namespace ck_tile::builder::test {
+
+namespace ckb = ck_tile::builder;
+
+// Renders the elements of a std::array as "Seq(e0,e1,...)".
+// Elements are streamed in index order; an empty array yields "Seq()".
+template <typename T, size_t N>
+std::string array_to_seq(const std::array<T, N>& arr)
+{
+    std::ostringstream out;
+    out << "Seq(";
+    // Empty before the first element, "," before every following one.
+    const char* separator = "";
+    for(const auto& element : arr)
+    {
+        out << separator << element;
+        separator = ",";
+    }
+    out << ")";
+    return out.str();
+}
+
+// Primary template: instantiating it for a type that has no dedicated
+// specialization trips the static_assert below and stops the build.
+template <typename T>
+std::string to_string(T)
+{
+    // The condition depends on T, so it is only evaluated on instantiation.
+    static_assert(sizeof(T) == 0, "Unsupported type");
+    return std::string{};
+}
+
+// Template specializations for enum types
+
+// Converts a PipelineVersion to text by streaming it into a string stream.
+template <>
+inline std::string to_string<PipelineVersion>(PipelineVersion t)
+{
+    std::ostringstream buffer;
+    buffer << t;
+    std::string text = buffer.str();
+    return text;
+}
+
+// Converts a PipelineScheduler to text by streaming it into a string stream.
+template <>
+inline std::string to_string<PipelineScheduler>(PipelineScheduler t)
+{
+    std::ostringstream buffer;
+    buffer << t;
+    std::string text = buffer.str();
+    return text;
+}
+
+// Converts a ConvFwdSpecialization to text by streaming it into a string stream.
+template <>
+inline std::string to_string<ConvFwdSpecialization>(ConvFwdSpecialization t)
+{
+    std::ostringstream buffer;
+    buffer << t;
+    std::string text = buffer.str();
+    return text;
+}
+
+// Converts a GemmSpecialization to text by streaming it into a string stream.
+template <>
+inline std::string to_string<GemmSpecialization>(GemmSpecialization t)
+{
+    std::ostringstream buffer;
+    buffer << t;
+    std::string text = buffer.str();
+    return text;
+}
+
+// Template specializations for struct types
+
+// Formats an MNK<size_t> as "Seq(m,n,k)".
+template <>
+inline std::string to_string<MNK<size_t>>(MNK<size_t> t)
+{
+    const std::array<size_t, 3> dims{t.m, t.n, t.k};
+    return array_to_seq(dims);
+}
+
+// Formats a ThreadBlock as "block_size,m,n,k", where m, n and k are read from tile_size.
+template <>
+inline std::string to_string<ThreadBlock>(ThreadBlock t)
+{
+    const auto& tile = t.tile_size;
+    std::ostringstream out;
+    out << t.block_size;
+    out << "," << tile.m;
+    out << "," << tile.n;
+    out << "," << tile.k;
+    return out.str();
+}
+
+// Formats a GridwiseXdlGemm as the comma-separated list
+// "ak1,bk1,m_per_xdl,n_per_xdl,m_xdl_per_wave,n_xdl_per_wave".
+template <>
+inline std::string to_string<GridwiseXdlGemm>(GridwiseXdlGemm t)
+{
+    std::ostringstream out;
+    out << t.ak1 << "," << t.bk1;
+    out << "," << t.m_per_xdl << "," << t.n_per_xdl;
+    out << "," << t.m_xdl_per_wave << "," << t.n_xdl_per_wave;
+    return out.str();
+}
+
+// Formats a GridwiseWmmaGemm as the comma-separated list
+// "k1,m_per_wmma,n_per_wmma,m_wmma_per_wave,n_wmma_per_wave".
+template <>
+inline std::string to_string<GridwiseWmmaGemm>(GridwiseWmmaGemm t)
+{
+    std::ostringstream out;
+    out << t.k1;
+    out << "," << t.m_per_wmma << "," << t.n_per_wmma;
+    out << "," << t.m_wmma_per_wave << "," << t.n_wmma_per_wave;
+    return out.str();
+}
+
+// Formats a BlockGemm as "<scheduler>,<pipeline_version>", using the
+// to_string conversions of both members.
+template <>
+inline std::string to_string<BlockGemm>(BlockGemm t)
+{
+    std::ostringstream out;
+    out << to_string(t.scheduler);
+    out << "," << to_string(t.pipeline_version);
+    return out.str();
+}
+
+// Formats a BlockTransfer as "Seq(k0,m_n,k1)".
+template <>
+inline std::string to_string<BlockTransfer>(BlockTransfer t)
+{
+    const std::array<size_t, 3> lengths{t.k0, t.m_n, t.k1};
+    return array_to_seq(lengths);
+}
+
+// Formats a ThreadCluster as "Seq(m_block,m_wave_per_xdl,n_block,n_wave_per_xdl)".
+template <>
+inline std::string to_string<ThreadCluster>(ThreadCluster t)
+{
+    const std::array<size_t, 4> dims{t.m_block, t.m_wave_per_xdl, t.n_block, t.n_wave_per_xdl};
+    return array_to_seq(dims);
+}
+
+// Formats an LdsTransfer as
+// "src_vector_dim,src_scalar_per_vector,lds_dst_scalar_per_vector,lds_padding,is_direct_load".
+// The two flags are written as the words "true" / "false".
+template <>
+inline std::string to_string<LdsTransfer>(LdsTransfer t)
+{
+    const char* const padding_text     = t.lds_padding ? "true" : "false";
+    const char* const direct_load_text = t.is_direct_load ? "true" : "false";
+
+    std::ostringstream out;
+    out << t.src_vector_dim << "," << t.src_scalar_per_vector;
+    out << "," << t.lds_dst_scalar_per_vector;
+    out << "," << padding_text << "," << direct_load_text;
+    return out.str();
+}
+
+// Formats an AccessOrder by rendering its `order` member as "Seq(...)".
+template <>
+inline std::string to_string<AccessOrder>(AccessOrder t)
+{
+    const auto& sequence = t.order;
+    return array_to_seq(sequence);
+}
+
+// Formats a TransferAB as a comma-separated list: block_transfer,
+// block_transfer_access_order and src_access_order (each via to_string),
+// followed by the lds_transfer members src_vector_dim, src_scalar_per_vector,
+// lds_dst_scalar_per_vector and lds_padding ("true" / "false").
+// lds_transfer.is_direct_load is not written by this function.
+template <>
+inline std::string to_string<TransferAB>(TransferAB t)
+{
+    const auto& lds = t.lds_transfer;
+
+    std::ostringstream out;
+    out << to_string(t.block_transfer) << ",";
+    out << to_string(t.block_transfer_access_order) << ",";
+    out << to_string(t.src_access_order) << ",";
+    out << lds.src_vector_dim << "," << lds.src_scalar_per_vector << ","
+        << lds.lds_dst_scalar_per_vector << ",";
+    out << (lds.lds_padding ? "true" : "false");
+    return out.str();
+}
+
+// Formats a TransferC as "m_xdl_per_wave_per_shuffle,n_per_wave_per_shuffle,
+// <thread_cluster_dims>,scalar_per_vector"; the scalar members are read from
+// `epilogue` and thread_cluster_dims is converted with to_string.
+template <>
+inline std::string to_string<TransferC>(TransferC t)
+{
+    const auto& epilogue = t.epilogue;
+
+    std::ostringstream out;
+    out << epilogue.m_xdl_per_wave_per_shuffle << "," << epilogue.n_per_wave_per_shuffle;
+    out << "," << to_string(t.thread_cluster_dims);
+    out << "," << epilogue.scalar_per_vector;
+    return out.str();
+}
+
+// Formats a TransferABC by joining the to_string output of its a, b and c
+// members with commas, in that order.
+template <>
+inline std::string to_string<TransferABC>(TransferABC t)
+{
+    std::ostringstream out;
+    out << to_string(t.a);
+    out << "," << to_string(t.b);
+    out << "," << to_string(t.c);
+    return out.str();
+}
+
+// Formats a DlThreadConfig as "k1,m1_per_thread,n1_per_thread,k_per_thread".
+template <>
+inline std::string to_string<DlThreadConfig>(DlThreadConfig t)
+{
+    std::ostringstream out;
+    out << t.k1;
+    out << "," << t.m1_per_thread;
+    out << "," << t.n1_per_thread;
+    out << "," << t.k_per_thread;
+    return out.str();
+}
+
+// Formats a DlThreadCluster as "Seq(<m1_xs>),Seq(<n1_xs>)".
+template <>
+inline std::string to_string<DlThreadCluster>(DlThreadCluster t)
+{
+    std::ostringstream out;
+    out << array_to_seq(t.m1_xs);
+    out << "," << array_to_seq(t.n1_xs);
+    return out.str();
+}
+
+// Formats a DlBlockTransfer as seven comma-separated "Seq(...)" groups, in
+// this order: thread_slice_lengths, thread_cluster_lengths,
+// thread_cluster_arrange_order, src_access_order, src_vector_tensor_lengths,
+// src_vector_tensor_contiguous_dim_order, dst_vector_tensor_lengths.
+template <>
+inline std::string to_string<DlBlockTransfer>(DlBlockTransfer t)
+{
+    std::ostringstream out;
+    out << array_to_seq(t.thread_slice_lengths);
+    out << "," << array_to_seq(t.thread_cluster_lengths);
+    out << "," << array_to_seq(t.thread_cluster_arrange_order);
+    out << "," << array_to_seq(t.src_access_order);
+    out << "," << array_to_seq(t.src_vector_tensor_lengths);
+    out << "," << array_to_seq(t.src_vector_tensor_contiguous_dim_order);
+    out << "," << array_to_seq(t.dst_vector_tensor_lengths);
+    return out.str();
+}
+
+// Formats a DlEpilogue as "Seq(<src_dst_access_order>),src_dst_vector_dim,dst_scalar_per_vector".
+template <>
+inline std::string to_string<DlEpilogue>(DlEpilogue t)
+{
+    std::ostringstream out;
+    out << array_to_seq(t.src_dst_access_order);
+    out << "," << t.src_dst_vector_dim;
+    out << "," << t.dst_scalar_per_vector;
+    return out.str();
+}
+
+// Formats a DlBlockTransferAB by delegating to to_string for its block_transfer member.
+template <>
+inline std::string to_string<DlBlockTransferAB>(DlBlockTransferAB t)
+{
+    const auto& inner = t.block_transfer;
+    return to_string(inner);
+}
+
+// Formats a DlBlockTransferC by delegating to to_string for its epilogue member.
+template <>
+inline std::string to_string<DlBlockTransferC>(DlBlockTransferC t)
+{
+    const auto& inner = t.epilogue;
+    return to_string(inner);
+}
+
+// Formats a DlTransferABC by joining the to_string output of its a, b and c
+// members with commas, in that order.
+template <>
+inline std::string to_string<DlTransferABC>(DlTransferABC t)
+{
+    std::ostringstream out;
+    out << to_string(t.a);
+    out << "," << to_string(t.b);
+    out << "," << to_string(t.c);
+    return out.str();
+}
+
+// Template specializations for factory wrapper types
+
+// Formats a ThreadBlock_ wrapper by delegating to to_string for its thread_block member.
+template <>
+inline std::string to_string<ThreadBlock_>(ThreadBlock_ t)
+{
+    const auto& inner = t.thread_block;
+    return to_string(inner);
+}
+
+// Formats an XdlGemm_ wrapper by delegating to to_string for its gridwise_gemm member.
+template <>
+inline std::string to_string<XdlGemm_>(XdlGemm_ t)
+{
+    const auto& inner = t.gridwise_gemm;
+    return to_string(inner);
+}
+
+// Formats a WmmaGemm_ wrapper by delegating to to_string for its gridwise_gemm member.
+template <>
+inline std::string to_string<WmmaGemm_>(WmmaGemm_ t)
+{
+    const auto& inner = t.gridwise_gemm;
+    return to_string(inner);
+}
+
+// Formats a Transfer_ wrapper by delegating to to_string for its transfer member.
+template <>
+inline std::string to_string<Transfer_>(Transfer_ t)
+{
+    const auto& inner = t.transfer;
+    return to_string(inner);
+}
+
+// Formats a ConvSpecialization_ as "<fwd_specialization>,<gemm_specialization>",
+// using the to_string conversions of both members.
+template <>
+inline std::string to_string<ConvSpecialization_>(ConvSpecialization_ t)
+{
+    std::ostringstream out;
+    out << to_string(t.fwd_specialization);
+    out << "," << to_string(t.gemm_specialization);
+    return out.str();
+}
+
+// Formats a Prefetch_ as "num_gemm_k_prefetch_stages,num_groups_to_merge,<loop_scheduler>",
+// where loop_scheduler is converted with to_string.
+template <>
+inline std::string to_string<Prefetch_>(Prefetch_ t)
+{
+    std::ostringstream out;
+    out << t.num_gemm_k_prefetch_stages;
+    out << "," << t.num_groups_to_merge;
+    out << "," << to_string(t.loop_scheduler);
+    return out.str();
+}
+
+// Formats a BlockGemm_ wrapper by delegating to to_string for its block_gemm member.
+template <>
+inline std::string to_string<BlockGemm_>(BlockGemm_ t)
+{
+    const auto& inner = t.block_gemm;
+    return to_string(inner);
+}
+
+// Formats a DlThreadConfig_ wrapper by delegating to to_string for its thread_config member.
+template <>
+inline std::string to_string<DlThreadConfig_>(DlThreadConfig_ t)
+{
+    const auto& inner = t.thread_config;
+    return to_string(inner);
+}
+
+// Formats a DlThreadCluster_ wrapper by delegating to to_string for its thread_cluster member.
+template <>
+inline std::string to_string<DlThreadCluster_>(DlThreadCluster_ t)
+{
+    const auto& inner = t.thread_cluster;
+    return to_string(inner);
+}
+
+// Formats a DlTransfer_ wrapper by delegating to to_string for its transfer member.
+template <>
+inline std::string to_string<DlTransfer_>(DlTransfer_ t)
+{
+    const auto& inner = t.transfer;
+    return to_string(inner);
+}
+
+// Template specializations for algorithm types
+
+// Formats the algorithm as "<ThreadBlock_>,<XdlGemm_>,<Transfer_>": the value is
+// converted to each of those types in turn and the to_string results are
+// joined with commas.
+template <>
+inline std::string to_string<ConvAlgorithm_DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle>(
+    ConvAlgorithm_DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle t)
+{
+    std::ostringstream out;
+    out << to_string(static_cast<ThreadBlock_>(t));
+    out << "," << to_string(static_cast<XdlGemm_>(t));
+    out << "," << to_string(static_cast<Transfer_>(t));
+    return out.str();
+}
+
+// Formats the algorithm as "<ThreadBlock_>,<XdlGemm_>,<Transfer_>": the value is
+// converted to each of those types in turn and the to_string results are
+// joined with commas.
+template <>
+inline std::string to_string<ConvAlgorithm_DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3>(
+    ConvAlgorithm_DeviceGroupedConvFwdMultipleABD_Xdl_CShuffle_V3 t)
+{
+    std::ostringstream out;
+    out << to_string(static_cast<ThreadBlock_>(t));
+    out << "," << to_string(static_cast<XdlGemm_>(t));
+    out << "," << to_string(static_cast<Transfer_>(t));
+    return out.str();
+}
+
+// Formats the algorithm as "<ThreadBlock_>,<WmmaGemm_>,<Transfer_>": the value is
+// converted to each of those types in turn and the to_string results are
+// joined with commas.
+template <>
+inline std::string to_string<ConvAlgorithm_DeviceGroupedConvFwdMultipleD_Wmma_CShuffle>(
+    ConvAlgorithm_DeviceGroupedConvFwdMultipleD_Wmma_CShuffle t)
+{
+    std::ostringstream out;
+    out << to_string(static_cast<ThreadBlock_>(t));
+    out << "," << to_string(static_cast<WmmaGemm_>(t));
+    out << "," << to_string(static_cast<Transfer_>(t));
+    return out.str();
+}
+
+// Formats the algorithm as
+// "<ThreadBlock_>,<DlThreadConfig_>,<DlThreadCluster_>,<DlTransfer_>": the value
+// is converted to each of those types in turn and the to_string results are
+// joined with commas.
+template <>
+inline std::string to_string<ConvAlgorithm_DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK>(
+    ConvAlgorithm_DeviceGroupedConvFwdDlMultipleD_NHWC_KYXC_NHWK t)
+{
+    std::ostringstream out;
+    out << to_string(static_cast<ThreadBlock_>(t));
+    out << "," << to_string(static_cast<DlThreadConfig_>(t));
+    out << "," << to_string(static_cast<DlThreadCluster_>(t));
+    out << "," << to_string(static_cast<DlTransfer_>(t));
+    return out.str();
+}
+
+// Formats the large-tensor algorithm by delegating to to_string for its
+// base_algorithm member.
+template <>
+inline std::string to_string<ConvAlgorithm_DeviceGroupedConvFwdMultipleD_Xdl_CShuffle_Large_Tensor>(
+    ConvAlgorithm_DeviceGroupedConvFwdMultipleD_Xdl_CShuffle_Large_Tensor t)
+{
+    const auto& base = t.base_algorithm;
+    return to_string(base);
+}
+
+} // namespace ck_tile::builder::test