mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-15 02:27:57 +00:00
clang-format and remove dead code
[ROCm/composable_kernel commit: edb78a4729]
This commit is contained in:
@@ -128,42 +128,39 @@ struct BlockFmhaPipelineQSKSVS
|
||||
typename OAccElementFunction,
|
||||
typename PositionEncoding>
|
||||
CK_TILE_HOST_DEVICE auto
|
||||
// operator()(const QDramBlockWindowTmp& q_dram_block_window_tmp, // M0*K0 tile
|
||||
// const QElementFunction& q_element_func,
|
||||
// const KDramBlockWindowTmp& k_dram_block_window_tmp, // N0*K0 tile
|
||||
// const KElementFunction& k_element_func,
|
||||
// const VDramBlockWindowTmp& v_dram_block_window_tmp, // N1*K1 tile
|
||||
// const VElementFunction& v_element_func,
|
||||
// const BiasDramBlockWindowTmp& bias_dram_block_window_tmp, // M0*N0 tile
|
||||
// const BiasElementFunction& bias_element_func,
|
||||
// LSEDramBlockWindowTmp& lse_dram_window_tmp, // M0*1 tile
|
||||
// const LSEElementFunction& lse_element_func,
|
||||
// const SAccElementFunction& s_acc_element_func,
|
||||
// const PComputeElementFunction& p_compute_element_func,
|
||||
// const OAccElementFunction& o_acc_element_func,
|
||||
// FmhaMask mask,
|
||||
// PositionEncoding position_encoding,
|
||||
// float scale_s,
|
||||
// void* smem_ptr) const
|
||||
operator()(const QDramBlockWindowTmp& q_dram_block_window_tmp, // M0*K0 tile
|
||||
const QElementFunction& q_element_func,
|
||||
const KDramBlockWindowTmp& k_dram_block_window_tmp, // N0*K0 tile
|
||||
const KElementFunction& k_element_func,
|
||||
const VDramBlockWindowTmp& v_dram_block_window_tmp, // N1*K1 tile
|
||||
const VElementFunction& v_element_func,
|
||||
const BiasDramBlockWindowTmp& bias_dram_block_window_tmp, // M0*N0 tile
|
||||
const BiasElementFunction& bias_element_func,
|
||||
RandValDramBlockWindowTmp& randval_dram_block_window_tmp,
|
||||
LSEDramBlockWindowTmp& lse_dram_window_tmp, // M0*1 tile
|
||||
const LSEElementFunction& lse_element_func,
|
||||
const SAccElementFunction& s_acc_element_func,
|
||||
const PComputeElementFunction& p_compute_element_func,
|
||||
const OAccElementFunction& o_acc_element_func,
|
||||
operator()(const QDramBlockWindowTmp & q_dram_block_window_tmp, // M0*K0 tile
|
||||
const QElementFunction &
|
||||
q_element_func,
|
||||
const KDramBlockWindowTmp &
|
||||
k_dram_block_window_tmp, // N0*K0 tile
|
||||
const KElementFunction &
|
||||
k_element_func,
|
||||
const VDramBlockWindowTmp &
|
||||
v_dram_block_window_tmp, // N1*K1 tile
|
||||
const VElementFunction &
|
||||
v_element_func,
|
||||
const BiasDramBlockWindowTmp &
|
||||
bias_dram_block_window_tmp, // M0*N0 tile
|
||||
const BiasElementFunction &
|
||||
bias_element_func,
|
||||
RandValDramBlockWindowTmp &
|
||||
randval_dram_block_window_tmp,
|
||||
LSEDramBlockWindowTmp &
|
||||
lse_dram_window_tmp, // M0*1 tile
|
||||
const LSEElementFunction &
|
||||
lse_element_func,
|
||||
const SAccElementFunction &
|
||||
s_acc_element_func,
|
||||
const PComputeElementFunction &
|
||||
p_compute_element_func,
|
||||
const OAccElementFunction &
|
||||
o_acc_element_func,
|
||||
FmhaMask mask,
|
||||
PositionEncoding position_encoding,
|
||||
float scale_s,
|
||||
void* smem_ptr,
|
||||
DropoutType& dropout) const
|
||||
DropoutType &
|
||||
dropout) const
|
||||
{
|
||||
static_assert(
|
||||
std::is_same_v<QDataType, remove_cvref_t<typename QDramBlockWindowTmp::DataType>> &&
|
||||
@@ -263,12 +260,12 @@ struct BlockFmhaPipelineQSKSVS
|
||||
{seqlen_k_start, 0});
|
||||
|
||||
const auto bias_origin = bias_dram_block_window_tmp.get_window_origin();
|
||||
auto bias_dram_window = make_tile_window(
|
||||
bias_dram_block_window_tmp.get_bottom_tensor_view(),
|
||||
bias_dram_block_window_tmp.get_window_lengths(),
|
||||
{bias_origin.at(number<0>{}), seqlen_k_start}, // M/N
|
||||
Policy::template MakeBiasDramTileDistribution<decltype(gemm_0)>());
|
||||
// Policy::template MakeBiasDramTileDistribution<Problem, decltype(gemm_0)>());
|
||||
auto bias_dram_window =
|
||||
make_tile_window(bias_dram_block_window_tmp.get_bottom_tensor_view(),
|
||||
bias_dram_block_window_tmp.get_window_lengths(),
|
||||
{bias_origin.at(number<0>{}), seqlen_k_start}, // M/N
|
||||
Policy::template MakeBiasDramTileDistribution<decltype(gemm_0)>());
|
||||
// Policy::template MakeBiasDramTileDistribution<Problem, decltype(gemm_0)>());
|
||||
|
||||
auto v_dram_window =
|
||||
make_tile_window(v_dram_block_window_tmp.get_bottom_tensor_view(),
|
||||
@@ -621,41 +618,6 @@ struct BlockFmhaPipelineQSKSVS
|
||||
return o_acc;
|
||||
}
|
||||
|
||||
// template <typename QDramBlockWindowTmp,
|
||||
// typename KDramBlockWindowTmp,
|
||||
// typename VDramBlockWindowTmp,
|
||||
// typename BiasDramBlockWindowTmp,
|
||||
// typename LSEDramBlockWindowTmp,
|
||||
// typename PositionEncoding>
|
||||
// CK_TILE_HOST_DEVICE auto
|
||||
// operator()(const QDramBlockWindowTmp& q_dram_block_window_tmp, // M0*K0 tile
|
||||
// const KDramBlockWindowTmp& k_dram_block_window_tmp, // N0*K0 tile
|
||||
// const VDramBlockWindowTmp& v_dram_block_window_tmp, // N1*K1 tile
|
||||
// const BiasDramBlockWindowTmp& bias_dram_block_window_tmp, // M0*N0 tile
|
||||
// LSEDramBlockWindowTmp& lse_dram_block_window_tmp, // M0*1 tile
|
||||
// FmhaMask mask,
|
||||
// PositionEncoding position_encoding,
|
||||
// float scale_s,
|
||||
// void* smem_ptr) const
|
||||
// {
|
||||
// return operator()(q_dram_block_window_tmp,
|
||||
// identity{},
|
||||
// k_dram_block_window_tmp,
|
||||
// identity{},
|
||||
// v_dram_block_window_tmp,
|
||||
// identity{},
|
||||
// bias_dram_block_window_tmp,
|
||||
// identity{},
|
||||
// lse_dram_block_window_tmp,
|
||||
// identity{},
|
||||
// identity{},
|
||||
// identity{},
|
||||
// identity{},
|
||||
// mask,
|
||||
// position_encoding,
|
||||
// scale_s,
|
||||
// smem_ptr);
|
||||
// }
|
||||
template <typename QDramBlockWindowTmp,
|
||||
typename KDramBlockWindowTmp,
|
||||
typename VDramBlockWindowTmp,
|
||||
|
||||
@@ -471,7 +471,7 @@ struct BlockFmhaPipelineQXKSVSCustomPolicy : BlockFmhaPipelineQXCustomPolicy<QLo
|
||||
|
||||
template <typename Problem, index_t IBuf = 0>
|
||||
CK_TILE_HOST_DEVICE static constexpr auto
|
||||
MakeKLdsStoreBlockDescriptor(number<IBuf> = number<0>{})
|
||||
MakeKLdsStoreBlockDescriptor(number<IBuf> = number<0>{})
|
||||
{
|
||||
// K is always k-major, we use async-copy to load into LDS
|
||||
constexpr index_t kNPerBlock = Problem::BlockFmhaShape::kN0;
|
||||
@@ -526,7 +526,7 @@ struct BlockFmhaPipelineQXKSVSCustomPolicy : BlockFmhaPipelineQXCustomPolicy<QLo
|
||||
#if K_LDS_LOAD_USE_OFFSET_TRANSFORM
|
||||
template <typename Problem, index_t IBuf = 0>
|
||||
CK_TILE_HOST_DEVICE static constexpr auto
|
||||
MakeKLdsLoadBlockDescriptor(number<IBuf> = number<0>{})
|
||||
MakeKLdsLoadBlockDescriptor(number<IBuf> = number<0>{})
|
||||
{
|
||||
// K is always k-major, we use async-copy to load into LDS
|
||||
constexpr index_t kNPerBlock = Problem::BlockFmhaShape::kN0;
|
||||
|
||||
Reference in New Issue
Block a user