mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-13 09:45:56 +00:00
initial cuda build
This commit is contained in:
12
src/include/direct_convolution.cuh
Normal file
12
src/include/direct_convolution.cuh
Normal file
@@ -0,0 +1,12 @@
|
||||
#pragma once
|
||||
#include "device_tensor.cuh"
|
||||
|
||||
// direct_convolution: kernel entry point; the body is currently empty.
//
// Template parameters:
//   TFloat    - element type pointed to by `in`, `wei` and `out`.
//   NBlockDim - compile-time integer; not referenced by the current body.
//
// Parameters:
//   in_desc / wei_desc / out_desc
//       DeviceTensorDescriptor values passed by value.
//       NOTE(review): presumably these describe the layout of `in`, `wei`
//       and `out` respectively - confirm against device_tensor.cuh.
//   in, wei
//       Const pointers (`TFloat* const`) - the pointer itself is const,
//       the pointee is not const-qualified.
//   out
//       Plain `TFloat*`.
//
// As written, the kernel reads and writes nothing.
// NOTE(review): looks like a placeholder awaiting an implementation - confirm.
template <class TFloat, int NBlockDim>
__global__ void direct_convolution(
    DeviceTensorDescriptor in_desc, TFloat* const in,
    DeviceTensorDescriptor wei_desc, TFloat* const wei,
    DeviceTensorDescriptor out_desc, TFloat* out)
{
    // Intentionally empty: no work is performed yet.
}
|
||||
Reference in New Issue
Block a user