fix undefined behaviour in softmax kernel (#3683)

Co-authored-by: root <zoltan.lakatos@streamhpc.com>
This commit is contained in:
Zoltán Lakatos
2026-01-30 08:22:54 +01:00
committed by GitHub
parent f3d8b7210f
commit 565fea2645

View File

@@ -26,7 +26,7 @@ __global__ void kernel_softmax(const GridDesc_M_K in_grid_desc_m_k,
AccDataType alpha,
const InDataType* const __restrict__ p_in_value_global,
AccDataType beta,
OutDataType* const __restrict__ p_out_value_global)
OutDataType* p_out_value_global)
{
GridwiseReduction::Run(in_grid_desc_m_k,
out_grid_desc_m_k,
@@ -91,7 +91,7 @@ struct GridwiseSoftmax_mk_to_mk
AccDataType alpha,
const InDataType* const __restrict__ p_in_value_global,
AccDataType beta,
OutDataType* const __restrict__ p_out_value_global)
OutDataType* p_out_value_global)
{
if constexpr(SweepOnce)
{