Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
Public Types | List of all members
cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ > Struct Template Reference

#include <hgemm_traits.h>

Inheritance diagram for cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >:
cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >

Public Types

typedef GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ > Base
 The base config. More...
 
typedef HgemmCrosswiseGlobalTileTraits< GemmOperand::kA, MatrixLayout::kRowMajor, half const, Shape< 1, GemmConfig_::OutputTile::kW, GemmConfig_::OutputTile::kD >, Shape< 1, GemmConfig_::kThreads/GemmConfig_::OutputTile::kD, GemmConfig_::OutputTile::kD >, GemmConfig_::kScalarsPerLdgA > GlobalTileTraits
 The traits class to build the iterator to load data from global memory for A^T. More...
 
typedef GemmSharedStoreWithSkewTileAbTraits< half, Shape< GemmConfig_::kStages, GemmConfig_::OutputTile::kD/GemmConfig_::InstructionShape::kD, GemmConfig_::OutputTile::kW *GemmConfig_::InstructionShape::kD >, typename GlobalTileTraits::Threads, 2, 128/sizeof(half)/GlobalTileTraits::Threads::kW/2 > SharedStoreTileTraits
 The traits class to build the iterator to store data to shared memory for A^T. More...
 
typedef GemmSharedLoadTileATraits< half const, typename GemmConfig_::OutputTile, typename GemmConfig_::Warps, typename GemmConfig_::MultiplyAdd::ThreadsPerWarp, typename GemmConfig_::InstructionShape, GemmConfig_::kStages, 8, SharedStoreTileTraits::kSkew > SharedLoadTileTraits
 The traits class to build the iterator to load from shared memory for A^T. More...
 
- Public Types inherited from cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >
typedef GemmConfig_::ScalarA Scalar
 The input scalar. More...
 
typedef GemmConfig_::MultiplyAdd::ScalarA MultiplyAddScalar
 The scalar stored in shared memory. More...
 
typedef GemmGlobalTileTraits< GemmOperand::kA, MatrixLayout::kRowMajor, Scalar const, Shape< 1, GemmConfig_::OutputTile::kW, GemmConfig_::OutputTile::kD >, Shape< 1, GemmConfig_::kThreads/GemmConfig_::OutputTile::kD, GemmConfig_::OutputTile::kD >, GemmConfig_::kScalarsPerLdgA > GlobalTileTraits
 The traits class to build the iterator to load data from global memory for A^T. More...
 
typedef GemmSharedStoreWithSkewTileAbTraits< MultiplyAddScalar, Shape< GemmConfig_::kStages, GemmConfig_::OutputTile::kD/GemmConfig_::InstructionShape::kD, GemmConfig_::OutputTile::kW *GemmConfig_::InstructionShape::kD >, typename GlobalTileTraits::Threads, GemmConfig_::kScalarsPerStsA, 128/sizeof(MultiplyAddScalar)/GemmConfig_::kScalarsPerStsA/GlobalTileTraits::Threads::kW *kScalarsIn4B > SharedStoreTileTraits
 The traits class to build the iterator to store data to shared memory for A^T. More...
 
typedef GemmSharedLoadTileATraits< MultiplyAddScalar const, typename GemmConfig_::OutputTile, typename GemmConfig_::Warps, typename GemmConfig_::MultiplyAdd::ThreadsPerWarp, typename GemmConfig_::InstructionShape, GemmConfig_::kStages, GemmConfig_::kScalarsPerLdsA, SharedStoreTileTraits::kSkew > SharedLoadTileTraits
 The traits class to build the iterator to load from shared memory for A^T. More...
 

Additional Inherited Members

- Static Public Attributes inherited from cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >
static MatrixLayout::Kind const kLayout = MatrixLayout::kRowMajor
 The layout. More...
 
static int const kScalarsIn4B = sizeof(MultiplyAddScalar) > 4 ? 1 : 4 / sizeof(MultiplyAddScalar)
 The number of scalars in 4B. More...
 

Member Typedef Documentation

◆ Base

template<typename GemmConfig_ >
typedef GemmTileTraitsHelperA<MatrixLayout::kRowMajor, GemmConfig_> cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::Base

◆ GlobalTileTraits

template<typename GemmConfig_ >
typedef HgemmCrosswiseGlobalTileTraits< GemmOperand::kA, MatrixLayout::kRowMajor, half const, Shape<1, GemmConfig_::OutputTile::kW, GemmConfig_::OutputTile::kD>, Shape<1, GemmConfig_::kThreads / GemmConfig_::OutputTile::kD, GemmConfig_::OutputTile::kD>, GemmConfig_::kScalarsPerLdgA> cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::GlobalTileTraits

◆ SharedLoadTileTraits

template<typename GemmConfig_ >
typedef GemmSharedLoadTileATraits< half const, typename GemmConfig_::OutputTile, typename GemmConfig_::Warps, typename GemmConfig_::MultiplyAdd::ThreadsPerWarp, typename GemmConfig_::InstructionShape, GemmConfig_::kStages, 8, SharedStoreTileTraits::kSkew> cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::SharedLoadTileTraits

◆ SharedStoreTileTraits

template<typename GemmConfig_ >
typedef GemmSharedStoreWithSkewTileAbTraits< half, Shape<GemmConfig_::kStages, GemmConfig_::OutputTile::kD / GemmConfig_::InstructionShape::kD, GemmConfig_::OutputTile::kW * GemmConfig_::InstructionShape::kD>, typename GlobalTileTraits::Threads, 2, 128 / sizeof(half) / GlobalTileTraits::Threads::kW / 2> cutlass::gemm::HgemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::SharedStoreTileTraits

The documentation for this struct was generated from the following file: