mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-02 20:51:23 +00:00
[CK_TILE] optimize moe-sorting kernel (#1771)
* opt moe sorting * remove commented code
This commit is contained in:
@@ -9,15 +9,20 @@
|
||||
|
||||
namespace ck_tile {
|
||||
|
||||
template <typename IndexType_, typename WeightType_, index_t InternalLoadUnroll_>
|
||||
template <typename IndexType_,
|
||||
typename WeightType_,
|
||||
index_t InternalLoadUnroll_,
|
||||
index_t ExpertTile_ = 0>
|
||||
struct MoeSortingProblem
|
||||
{
|
||||
// TODO: this kernel only support warp per row
|
||||
using WeightType = remove_cvref_t<WeightType_>;
|
||||
using IndexType = remove_cvref_t<IndexType_>;
|
||||
|
||||
static constexpr index_t WarpSize = get_warp_size();
|
||||
static constexpr index_t WarpsPerBlock = 1;
|
||||
static constexpr index_t InternalLoadUnroll = InternalLoadUnroll_;
|
||||
static constexpr index_t WarpSize = get_warp_size();
|
||||
static constexpr index_t WarpsPerBlock = 1;
|
||||
static constexpr index_t InternalLoadUnroll =
|
||||
InternalLoadUnroll_; // TODO: need better design(like tile size)
|
||||
static constexpr index_t ExpertTile = ExpertTile_; // TODO: only used in store out
|
||||
};
|
||||
} // namespace ck_tile
|
||||
|
||||
Reference in New Issue
Block a user