mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-06-29 11:16:59 +00:00
fix coredump in e2e test
This commit is contained in:
@@ -1576,7 +1576,7 @@ struct GridwiseMoeGemm
|
||||
static_for<0, EMRepeats, 1>{}([&](auto m0) {
|
||||
const index_t fused_token = p_sorted_token_ids[c_token_pos + m0];
|
||||
index_t token_offset = fused_token & 0xffffff;
|
||||
float weight = p_sorted_weights_0[token_offset * problem.StrideDs[0]];
|
||||
float weight = token_offset < problem.NumTokens? p_sorted_weights_0[token_offset * problem.StrideDs[0]] : 1.0;
|
||||
if constexpr(IsInputGemm)
|
||||
{
|
||||
token_offset = token_offset * problem.TopK + (fused_token >> 24);
|
||||
|
||||
Reference in New Issue
Block a user