#include <gemm_shared_tile.h>
|
typedef platform::remove_const< Scalar_ >::type | Scalar |
| The scalar. More...
|
|
typedef Scalar_ * | Pointer |
| The pointer. More...
|
|
typedef OutputTile_ | OutputTile |
| The dimension of the output tile. More...
|
|
typedef Warps_ | Warps |
| The warps in the tile. More...
|
|
typedef ThreadsPerWarp_ | ThreadsPerWarp |
| The threads in the warps. More...
|
|
typedef Shape< 1, 2, kScalarsPerRow/kAccessSize, kAccessSize > | Tile |
|
typedef Shape< kIterationsD, kIterationsH, OutputTile::kW/kWarpSize/kAccessSize, Warps::kD > | Iterations |
| The number of iterations needed to store the tile. More...
|
|
typedef Shape< OutputTile::kW, kScalarsPerRow, kWarpSize *kAccessSize, kSplitK > | ImmediateOffsetStrides |
| The strides in each dimension between different loads/stores. More...
|
|
typedef Shape< OutputTile::kW, kScalarsPerRow, kWarpSize *kAccessSize, kSplitK > | Delta |
| The strides in each dimension between different loads/stores. More...
|
|
◆ Delta
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ ImmediateOffsetStrides
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Iterations
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ OutputTile
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Pointer
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Scalar
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ ThreadsPerWarp
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Tile
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
The tile. We have 2 rows of scalars. We use those two rows to make sure we do not have bank conflicts in the epilogue.
◆ Warps
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kAccessSize
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsD
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsH
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsInHPerWarp
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kMemorySpace
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kScalarsPerRow
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kScalarsPerThread
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
static int const cutlass::gemm::GemmSharedLoadTileDTraits< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::kScalarsPerThread = OutputTile_::kW / Warps::kW / ThreadsPerWarp::kW
◆ kSkew
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kSplitK
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kThreads
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
The documentation for this struct was generated from the following file: