// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2023, Advanced Micro Devices, Inc. All rights reserved.

#pragma once

#include "ck_tile/core.hpp"
#include "ck_tile/ops/gemm/warp/warp_gemm_impl.hpp"
#include "ck_tile/ops/gemm/warp/warp_gemm_attribute_mfma.hpp"

namespace ck_tile {

// Named aliases for WarpGemmImpl instantiations, grouped below by the
// element-type section comments (fp16, bf16, fp8).
//
// NOTE(review): this copy of the file looks damaged. Most aliases read
// `WarpGemmImpl>;` -- a closing `>` with no matching `<` -- so the template
// argument list is missing and the declarations are not valid C++ as written.
// The `...TransposedCDistribution` / `..._CTransposed` aliases all share the
// exact same right-hand side, which suggests their inner template argument was
// lost as well. Restore the arguments from the authoritative copy of this
// header; they are deliberately not reconstructed here.
//
// NOTE(review): `WarpGemmAtrributeMfmaTransposedCDistribution` is spelled
// "Atrribute" in this file. Presumably that matches the declaration in the
// included attribute header -- confirm before renaming anything.
//
// NOTE(review): alias names appear to encode A/B/accumulator element types and
// M/N/K extents (e.g. F16F16F32, M32N32K8) -- TODO confirm against the
// attribute definitions.

// fp16
using WarpGemmMfmaF16F16F32M32N32K8 = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M16N16K16 = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M32N32K16 = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M16N16K32 = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M32N32K8TransposedCDistribution = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfmaF16F16F32M16N16K16TransposedCDistribution = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfmaF16F16F32M32N32K16TransposedCDistribution = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M16N16K32TransposedCDistribution = WarpGemmImpl>;

using WarpGemmMfmaF16F16F32M16N16K32SwizzleBTransposedCDistribution = WarpGemmImpl>;

// bf16
// Same nine alias shapes as the fp16 group, with Bf16Bf16 in the names.
using WarpGemmMfmaBf16Bf16F32M32N32K8 = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M16N16K16 = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M32N32K16 = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M16N16K32 = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M32N32K8TransposedCDistribution = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfmaBf16Bf16F32M16N16K16TransposedCDistribution = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfmaBf16Bf16F32M32N32K16TransposedCDistribution = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M16N16K32TransposedCDistribution = WarpGemmImpl>;

using WarpGemmMfmaBf16Bf16F32M16N16K32SwizzleBTransposedCDistribution = WarpGemmImpl>;

// fp8
// These aliases use a different naming scheme (`_f32_32x32x16_<a>_<b>`), one
// alias per fp8/bf8 operand pairing, followed by a `_CTransposed` variant of
// each pairing.
using WarpGemmMfma_f32_32x32x16_fp8_fp8 = WarpGemmImpl>;

using WarpGemmMfma_f32_32x32x16_fp8_bf8 = WarpGemmImpl>;

using WarpGemmMfma_f32_32x32x16_bf8_fp8 = WarpGemmImpl>;

using WarpGemmMfma_f32_32x32x16_bf8_bf8 = WarpGemmImpl>;

using WarpGemmMfma_f32_32x32x16_fp8_fp8_CTransposed = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfma_f32_32x32x16_fp8_bf8_CTransposed = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfma_f32_32x32x16_bf8_fp8_CTransposed = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

using WarpGemmMfma_f32_32x32x16_bf8_bf8_CTransposed = WarpGemmImpl<
    WarpGemmAtrributeMfmaTransposedCDistribution>;

} // namespace ck_tile