Add asm for no-loop v3_128x128x128

This commit is contained in:
OscarXu
2025-05-06 10:47:29 +08:00
parent efbb85be2a
commit e7fe8587f6
2 changed files with 24 additions and 24 deletions

View File

@@ -491,30 +491,30 @@ struct DeviceMoeGemmBlockScale
RunKernel(kernel);
}
}
// else if constexpr(BlkGemmPipelineVer == BlockGemmPipelineVersion::v2 ||
// BlkGemmPipelineVer == BlockGemmPipelineVersion::v3)
// {
// if(GridwiseGemm::CalculateKBlockLoopTailNum(K_split) == TailNumber::Odd)
// {
// const auto kernel = kernel_moe_gemm_2lds<GridwiseGemm,
// false,
// MemoryDataOp,
// minimum_occupancy,
// IsInputGemm,
// TailNumber::Odd>;
// RunKernel(kernel);
// }
// else
// {
// const auto kernel = kernel_moe_gemm_2lds<GridwiseGemm,
// false,
// MemoryDataOp,
// minimum_occupancy,
// IsInputGemm,
// TailNumber::Even>;
// RunKernel(kernel);
// }
// }
else if constexpr(BlkGemmPipelineVer == BlockGemmPipelineVersion::v2 ||
BlkGemmPipelineVer == BlockGemmPipelineVersion::v3)
{
if(GridwiseGemm::CalculateKBlockLoopTailNum(K_split) == TailNumber::Odd)
{
const auto kernel = kernel_moe_gemm_2lds<GridwiseGemm,
false,
MemoryDataOp,
minimum_occupancy,
IsInputGemm,
TailNumber::Odd>;
RunKernel(kernel);
}
else
{
const auto kernel = kernel_moe_gemm_2lds<GridwiseGemm,
false,
MemoryDataOp,
minimum_occupancy,
IsInputGemm,
TailNumber::Even>;
RunKernel(kernel);
}
}
}
#endif
#endif