Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ > Template Reference
#include <gemm_traits.h>
Public Types
typedef GemmConfig_::ScalarA | Scalar
The input scalar.
typedef GemmConfig_::MultiplyAdd::ScalarA | MultiplyAddScalar
The scalar stored in shared memory.
typedef GemmGlobalTileTraits< GemmOperand::kA, MatrixLayout::kRowMajor, Scalar const, Shape< 1, GemmConfig_::OutputTile::kW, GemmConfig_::OutputTile::kD >, Shape< 1, GemmConfig_::kThreads/GemmConfig_::OutputTile::kD, GemmConfig_::OutputTile::kD >, GemmConfig_::kScalarsPerLdgA > | GlobalTileTraits
The traits class used to build the iterator that loads data from global memory for A^T.
Static Public Attributes
static MatrixLayout::Kind const | kLayout = MatrixLayout::kRowMajor
The layout.
static int const | kScalarsIn4B = sizeof(MultiplyAddScalar) > 4 ? 1 : 4 / sizeof(MultiplyAddScalar)
The number of scalars in 4B.
static int const | kSkewA
The skew for A.
typedef GemmGlobalTileTraits< GemmOperand::kA, MatrixLayout::kRowMajor, Scalar const, Shape<1, GemmConfig_::OutputTile::kW, GemmConfig_::OutputTile::kD>, Shape<1, GemmConfig_::kThreads / GemmConfig_::OutputTile::kD, GemmConfig_::OutputTile::kD>, GemmConfig_::kScalarsPerLdgA> cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::GlobalTileTraits |
typedef GemmConfig_::MultiplyAdd::ScalarA cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::MultiplyAddScalar |
typedef GemmConfig_::ScalarA cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::Scalar |
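MatrixLayout::Kind const cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::kLayout = MatrixLayout::kRowMajor [static]

int const cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::kScalarsIn4B = sizeof(MultiplyAddScalar) > 4 ? 1 : 4 / sizeof(MultiplyAddScalar) [static]

int const cutlass::gemm::GemmTileTraitsHelperA< MatrixLayout::kRowMajor, GemmConfig_ >::kSkewA [static]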