mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-12 01:10:17 +00:00
nvidia build
This commit is contained in:
@@ -19,8 +19,6 @@ namespace ck {
|
||||
// Tag identifying an address space. In this variant every enumerator has its
// own distinct value (0..3), so code can tell the four spaces apart.
// NOTE(review): the names suggest generic / vector-register / local-data-share /
// global memory -- confirm against the code that consumes these tags.
enum address_space_t
{
    generic = 0,
    vgpr    = 1,
    lds     = 2,
    global  = 3
};
|
||||
|
||||
|
||||
@@ -21,8 +21,6 @@ namespace ck {
|
||||
// Tag identifying an address space. In this variant every named space is an
// alias of `generic` (value 0), so all four enumerators compare equal and any
// dispatch keyed on the tag collapses to the generic case.
// NOTE(review): presumably this is the configuration for a backend that does not
// distinguish these spaces -- confirm against the build that includes this header.
enum address_space_t
{
    generic = 0,
    vgpr    = generic,
    lds     = generic,
    global  = generic
};
|
||||
|
||||
@@ -39,6 +37,17 @@ using index_t = int32_t;
|
||||
using float2_t = float2;
|
||||
using float4_t = float4;
|
||||
|
||||
// data type conversion
|
||||
// Function object that converts a value to the destination type T.
//
// T is fixed when the functor is instantiated; the source type X is deduced
// at each call, so one type_convert<T> object can convert from any type for
// which static_cast<T> is well-formed.
template <typename T>
struct type_convert
{
    // Returns x converted to T via static_cast (device-side callable).
    template <typename X>
    __device__ T operator()(const X& x) const
    {
        return static_cast<T>(x);
    }
};
|
||||
|
||||
template <class T>
|
||||
__device__ void fused_multiply_accumulate(T& d, const T& s0, const T& s1)
|
||||
{
|
||||
|
||||
Reference in New Issue
Block a user