initial cuda build

This commit is contained in:
Chao Liu
2018-10-22 11:51:10 -05:00
parent d51b81588f
commit 2f2cf35bf4
7 changed files with 179 additions and 82 deletions

View File

@@ -0,0 +1,12 @@
#pragma once
#include "device_tensor.cuh"
// direct_convolution: kernel entry point for a direct convolution.
//
// The body is currently empty, so a launch of this kernel executes no
// statements and leaves every argument untouched.
//
// Template parameters:
//   TFloat    - pointee type of the `in`, `wei` and `out` pointers.
//   NBlockDim - compile-time integer; not referenced by the present body
//               (presumably the thread-block size -- TODO confirm with the
//               launch site).
//
// Parameters:
//   in_desc,  in  - tensor descriptor (by value) and data pointer; presumably
//                   the convolution input -- TODO confirm.
//   wei_desc, wei - tensor descriptor (by value) and data pointer; presumably
//                   the filter weights -- TODO confirm.
//   out_desc, out - tensor descriptor (by value) and data pointer; presumably
//                   the convolution result -- TODO confirm.
//
// NOTE(review): `TFloat* const` makes the pointer itself const, not the data
// it points to. If `in` and `wei` are meant to be read-only, `const TFloat*`
// would express that -- confirm the intent before changing the signature.
template <typename TFloat, int NBlockDim>
__global__ void direct_convolution(DeviceTensorDescriptor in_desc, TFloat* const in,
                                   DeviceTensorDescriptor wei_desc, TFloat* const wei,
                                   DeviceTensorDescriptor out_desc, TFloat* out)
{
    // No implementation yet: the kernel body contains no statements.
}