#include <gemm_shared_tile.h>
|
| typedef platform::remove_const< Scalar_ >::type | Scalar |
| | The scalar. More...
|
| |
| typedef Scalar_ * | Pointer |
| | The pointer. More...
|
| |
| typedef OutputTile_ | OutputTile |
| | The dimension of the output tile. More...
|
| |
| typedef Warps_ | Warps |
| | The warps in the tile. More...
|
| |
| typedef ThreadsPerWarp_ | ThreadsPerWarp |
| | The threads in the warps. More...
|
| |
| typedef Shape< 1, 2, kScalarsPerRow/kAccessSize, kAccessSize > | Tile |
| |
| typedef Shape< kIterationsD, kIterationsH, OutputTile::kW/kWarpSize/kAccessSize, Warps::kD > | Iterations |
| | The number of iterations needed to store the tile. More...
|
| |
| typedef Shape< OutputTile::kW, kScalarsPerRow, kWarpSize *kAccessSize, kSplitK > | ImmediateOffsetStrides |
| | The strides in each dimension between different loads/stores. More...
|
| |
| typedef Shape< OutputTile::kW, kScalarsPerRow, kWarpSize *kAccessSize, kSplitK > | Delta |
| | The strides in each dimension between different loads/stores. More...
|
| |
◆ Delta
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ ImmediateOffsetStrides
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Iterations
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ OutputTile
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Pointer
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Scalar
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ ThreadsPerWarp
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ Tile
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
The tile. It holds two rows of scalars; using two rows ensures that there are no bank conflicts in the epilogue.
◆ Warps
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kAccessSize
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsD
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsH
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kIterationsInHPerWarp
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kMemorySpace
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kScalarsPerRow
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kScalarsPerThread
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
| static int const cutlass::gemm::GemmSharedLoadTileDTraits< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::kScalarsPerThread = OutputTile_::kW / Warps::kW / ThreadsPerWarp::kW |
◆ kSkew
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kSplitK
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
◆ kThreads
template<typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0>
The documentation for this struct was generated from the following file: