mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-04 05:31:24 +00:00
Use int64_t for the expert stride (N * K) to avoid overflow
This commit is contained in:
@@ -644,7 +644,8 @@ struct MoeFlatmmKernel
|
||||
});
|
||||
|
||||
const SplitKBatchOffset splitk_batch_offset(kargs);
|
||||
const index_t expert_stride = __builtin_amdgcn_readfirstlane(kargs.N * kargs.K);
|
||||
const long_index_t expert_stride =
|
||||
__builtin_amdgcn_readfirstlane(long_index_t(kargs.N) * kargs.K);
|
||||
|
||||
const ADataType* a_ptr =
|
||||
static_cast<const ADataType*>(kargs.a_ptr) + splitk_batch_offset.a_k_split_offset;
|
||||
|
||||
Reference in New Issue
Block a user