diff --git a/include/ck_tile/ops/rmsnorm2d/kernel/rmsnorm2d_fwd_kernel.hpp b/include/ck_tile/ops/rmsnorm2d/kernel/rmsnorm2d_fwd_kernel.hpp index 6207c24f43..99084a25e4 100644 --- a/include/ck_tile/ops/rmsnorm2d/kernel/rmsnorm2d_fwd_kernel.hpp +++ b/include/ck_tile/ops/rmsnorm2d/kernel/rmsnorm2d_fwd_kernel.hpp @@ -134,10 +134,8 @@ struct Rmsnorm2dFwd number{}, number<1>{}); - // NOTE: we don't do any pad in this kernel for loading, assume that inside kernel will - // check the max count dynamically const auto tmp2_ = pad_tensor_view( - tmp_, make_tuple(number{}, number{}), sequence{}); + tmp_, make_tuple(number{}, number{}), sequence{}); return make_tile_window( tmp2_, make_tuple(number{}, number{}), {iM, 0}); }(); @@ -151,7 +149,7 @@ struct Rmsnorm2dFwd number<1>{}); const auto tmp2_ = - pad_tensor_view(tmp_, make_tuple(number{}), sequence{}); + pad_tensor_view(tmp_, make_tuple(number{}), sequence{}); return make_tile_window(tmp2_, make_tuple(number{}), {0}); }();