Fix kBlockSize

This commit is contained in:
Damien Lejeune
2026-01-21 07:42:59 -05:00
parent 557a8d3f21
commit 9a743139af
2 changed files with 4 additions and 5 deletions

View File

@@ -24,7 +24,6 @@ namespace ck_tile {
// static constexpr index_t Repeat_N = Repeat_N;
// };
template <typename BlockWarps, // num warps along seq<M, N>
typename BlockTile, // block size, seq<M, N>
typename WarpTile, // warp size, seq<M, N>
@@ -56,8 +55,7 @@ struct SinkhornKnoppShape
static constexpr index_t Repeat_M = Block_M * RepeatInWarp_M / (WarpPerBlock_M * Warp_M);
static constexpr index_t Repeat_N = Block_N * RepeatInWarp_N / (WarpPerBlock_N * Warp_N);
-// static constexpr index_t BlockSize = ck_tile::get_warp_size();
-static constexpr index_t BlockSize = 1; // TODO
+static constexpr index_t BlockSize = ck_tile::get_warp_size();
};
template <typename _XDataType,

View File

@@ -75,7 +75,7 @@ struct SinkhornKnoppKernelDummyNonStochastic
return tensor;
}
-CK_TILE_DEVICE void operator()([[maybe_unused]]const SinkhornKnoppArgs& args) const
+CK_TILE_DEVICE void operator()([[maybe_unused]] const SinkhornKnoppArgs& args) const
{
// using S = Problem::BlockShape;
@@ -83,7 +83,8 @@ struct SinkhornKnoppKernelDummyNonStochastic
// const auto x_desc = make_naive_tensor_descriptor(make_tuple(args.input_m, args.input_m),
// make_tuple(args.input_m, 1),
-// number<4>{}, // TODO: Hardcoded vectorization, we should calculate it!
+// number<4>{}, // TODO: Hardcoded
+// vectorization, we should calculate it!
// number<1>{});
// auto buffer_view = make_buffer_view<address_space_enum::global>(