[ROCm/composable_kernel commit: 0597116330]
This commit is contained in:
Chao Liu
2019-01-09 19:11:45 -06:00
parent 936627209e
commit a943d79f4c
2 changed files with 3 additions and 0 deletions

View File

@@ -76,6 +76,7 @@ blockwise_4d_tensor_pointwise_operation_unary(DstDesc, Float* __restrict__ p_dst
}
}
// Function: p_dst[reorder[i0], reorder[i1], reorder[i2], reorder[i3]] = p_src[i0,i1,i2,i3]
// TODO: write specialized versions to optimize memory access for each
// memory type
template <unsigned BlockSize,

View File

@@ -11,3 +11,5 @@ struct is_same<T, T>
{
static const bool value = true;
};
// Returns the x component of the calling thread's index (threadIdx.x).
// Only the x dimension is read; the y and z components of threadIdx are
// not taken into account.
__device__ unsigned get_thread_local_id()
{
    const unsigned local_id = threadIdx.x;
    return local_id;
}