adding implicit gemm v3

[ROCm/composable_kernel commit: b7d052459d]
This commit is contained in:
Chao Liu
2019-05-15 09:58:17 -05:00
parent aeeefc1de3
commit ac7741cc7c
29 changed files with 977 additions and 296 deletions

View File

@@ -85,7 +85,7 @@ struct TensorDescriptor
{
}
std::size_t GetDimension() const;
std::size_t GetNumOfDimension() const;
std::size_t GetElementSize() const;
std::size_t GetElementSpace() const;
@@ -95,7 +95,7 @@ struct TensorDescriptor
// Maps a multi-dimensional index (one argument per dimension) to a single
// linear offset by summing index[k] * mStrides[k] over all supplied indices.
//
// Is... : index arguments; each one is converted to std::size_t.
// Returns the accumulated offset as std::size_t.
//
// mStrides is declared outside this view; presumably it holds one stride per
// dimension of the descriptor -- TODO confirm against the struct definition.
template <class... Is>
std::size_t Get1dIndex(Is... is) const
{
// NOTE(review): two near-identical asserts appear here, one calling
// GetDimension() and one calling GetNumOfDimension(). This looks like a diff
// rendering in which the GetDimension() line is the pre-rename form and the
// GetNumOfDimension() line is its replacement -- confirm against the real file.
// Both check that the number of indices passed equals the value the
// descriptor reports.
assert(sizeof...(Is) == this->GetDimension());
assert(sizeof...(Is) == this->GetNumOfDimension());
// Collect the indices, cast to std::size_t, into a list we can iterate over.
std::initializer_list<std::size_t> iss{static_cast<std::size_t>(is)...};
// Inner product of the indices with the leading entries of mStrides, starting
// from 0; one entry of mStrides is read per supplied index.
return std::inner_product(iss.begin(), iss.end(), mStrides.begin(), std::size_t{0});
}
@@ -206,7 +206,7 @@ struct Tensor
template <class G>
void GenerateTensorValue(G g, std::size_t num_thread = 1)
{
switch(mDesc.GetDimension())
switch(mDesc.GetNumOfDimension())
{
case 1:
{