mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
Update include path to break the cyclic dependency issue; use ck_tile::permute_vectors_i4x4_b in tile engine. Co-authored-by: Damien Lejeune <damien.lejeune@amd.com>; Co-authored-by: Adam Osewski <19374865+aosewski@users.noreply.github.com>
18 lines
791 B
C++
18 lines
791 B
C++
// SPDX-License-Identifier: MIT
|
|
// Copyright (c) 2018-2025, Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
#pragma once
|
|
|
|
#include "ck_tile/ops/reduce/block/block_reduce.hpp"
|
|
#include "ck_tile/ops/reduce/block/block_reduce2d.hpp"
|
|
#include "ck_tile/ops/reduce/block/block_reduce2d_problem.hpp"
|
|
#include "ck_tile/ops/reduce/kernel/reduce2d_kernel.hpp"
|
|
#include "ck_tile/ops/reduce/pipeline/reduce2d_default_policy.hpp"
|
|
#include "ck_tile/ops/reduce/pipeline/reduce2d_problem.hpp"
|
|
#include "ck_tile/ops/reduce/pipeline/reduce2d_shape.hpp"
|
|
#include "ck_tile/ops/common/generic_2d_block_shape.hpp"
|
|
#include "ck_tile/ops/common/load_interleaved_pk_type.hpp"
|
|
#include "ck_tile/ops/common/streamk_common.hpp"
|
|
#include "ck_tile/ops/common/tensor_layout.hpp"
|
|
#include "ck_tile/ops/common/utils.hpp"
|