mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-12 17:26:00 +00:00
added implicit gemm v1r3 lds_double_buffer NCHW * CYXK = KNHW, reworked static functionals
This commit is contained in:
@@ -19,6 +19,20 @@ struct Array
|
||||
// Read-only element access: returns a const reference to element i.
// The index is forwarded to mData unchecked.
__host__ __device__ const TData& operator[](index_t i) const
{
    return mData[i];
}
|
||||
|
||||
// Mutable element access: returns a reference to element i so the caller can
// assign through it. The index is forwarded to mData unchecked.
__host__ __device__ TData& operator[](index_t i)
{
    return mData[i];
}
|
||||
|
||||
// Returns a new Array holding NSize + 1 elements: the elements of this array
// in order, followed by x. This array itself is not modified.
__host__ __device__ auto PushBack(TData x) const
{
    Array<TData, NSize + 1> new_array;

    // The lambda must capture new_array by reference. With a by-copy capture
    // the closure holds its own (const) copy of new_array, so the assignment
    // below is ill-formed when instantiated, and even a mutable closure would
    // only fill its private copy, leaving the returned array unpopulated.
    static_for<0, NSize, 1>{}([&](auto I) {
        constexpr index_t i = I.Get();
        new_array[i] = mData[i];
    });

    // Append the new element after the copied ones.
    new_array[NSize] = x;

    return new_array;
}
|
||||
};
|
||||
|
||||
template <class TData, index_t NSize, index_t... IRs>
|
||||
@@ -51,4 +65,4 @@ __host__ __device__ auto reorder_array_given_old2new(const Array<TData, NSize>&
|
||||
});
|
||||
|
||||
return new_array;
|
||||
}
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user