Add grouped conv fwd bias relu instances (#2179)

* Add grouped conv fwd bias relu instances

* fixes

* fix
This commit is contained in:
Bartłomiej Kocot
2025-05-09 22:52:34 +02:00
committed by GitHub
parent 6b1a339b6f
commit 6fddb5708c
33 changed files with 2477 additions and 550 deletions

View File

@@ -404,6 +404,14 @@ struct AddRelu
y = a > type_convert<bhalf_t>(0.0f) ? a : type_convert<bhalf_t>(0.0f);
};
// AddRelu for all-bhalf_t operands: y = max(x0 + x1, 0).
// Both inputs are widened to float, added and clamped at zero in float, and
// only the final value is narrowed back to bhalf_t.
template <>
__host__ __device__ constexpr void
operator()<bhalf_t, bhalf_t, bhalf_t>(bhalf_t& y, const bhalf_t& x0, const bhalf_t& x1) const
{
    const float a = type_convert<float>(x0) + type_convert<float>(x1);
    // Narrow explicitly through type_convert instead of assigning the float
    // to y directly: a plain assignment relies on an implicit float -> bhalf_t
    // conversion, which is a numeric truncation (not a bf16 encoding) if
    // bhalf_t is an integer storage alias -- TODO confirm its definition.
    // Keeping both ternary arms as float also avoids mixing float and bhalf_t
    // operands in the comparison and selection.
    y = type_convert<bhalf_t>(a > 0.0f ? a : 0.0f);
};
template <>
__host__ __device__ constexpr void
operator()<int, int, int8_t>(int& y, const int& x0, const int8_t& x1) const