mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-16 19:09:59 +00:00
Use __builtin_amdgcn_rcpf in the SiLU function
This commit is contained in:
@@ -247,7 +247,7 @@ struct HstuAttentionFwdPipelineQRKSVS
|
||||
const auto f_silu = [](CompDataType& x) {
|
||||
const auto neg_one = ck_tile::type_convert<CompDataType>(-1.0f);
|
||||
|
||||
return x = x / (neg_one - exp(x));
|
||||
x = x * __builtin_amdgcn_rcpf(neg_one - exp(x));
|
||||
};
|
||||
|
||||
using OaccBlockTileType = decltype(gemm_1.MakeCBlockTile());
|
||||
|
||||
Reference in New Issue
Block a user