|
typedef GemmEpilogueTraitsHelper< IgemmConfig_, EpilogueFunctor_, Index_ > | Base |
| The base class. More...
|
|
typedef IgemmConfig_ | IgemmConfig |
| The config. More...
|
|
typedef Base::Scalar | Scalar |
| The scalar type of the epilogue. More...
|
|
typedef Base::Iterations | Iterations |
| The iterations. More...
|
|
typedef Base::Delta | Delta |
| The iteration strides. More...
|
|
typedef Base::GlobalLoadTileTraits | GlobalLoadTileTraits |
| The traits class for the iterator. More...
|
|
typedef GemmGlobalIteratorCd< GlobalLoadTileTraits > | GlobalLoadIteratorC |
| The iterator to load C from global memory. More...
|
|
typedef GlobalLoadIteratorC::Fragment | GlobalFragmentC |
| The fragment that needs to be produced by the load iterator. More...
|
|
typedef IgemmGlobalLoadTransformer< GlobalFragmentC, Scalar >::Transformer | GlobalTransformerC |
| The transformer from loaded data to math fragment. More...
|
|
typedef Base::GlobalStoreTileTraits | GlobalStoreTileTraits |
| The traits class for the iterator. More...
|
|
typedef GemmGlobalIteratorCd< GlobalStoreTileTraits > | GlobalStoreIteratorD |
| The iterator to store D to global memory. More...
|
|
typedef GlobalStoreIteratorD::Fragment | GlobalFragmentD |
| The fragment that needs to be passed to the store iterator. More...
|
|
typedef IgemmGlobalStoreTransformer< Scalar, GlobalFragmentD >::Transformer | GlobalTransformerD |
| The transformer from the math fragment to the fragment stored to global memory. More...
|
|
typedef Base::SharedStoreTileTraits | SharedStoreTileTraits |
| The traits class for the shared iterator to store D to shared memory. More...
|
|
typedef TileStoreIterator< SharedStoreTileTraits, typename SharedStoreTileTraits::Scalar, IteratorAdvance::kH, MemorySpace::kGlobal > | SharedStoreIteratorD |
| The shared iterator to store D to shared memory. More...
|
|
typedef SharedStoreIteratorD::Fragment | SharedStoreFragmentD |
| The fragment that needs to be passed to the store iterator. More...
|
|
typedef IgemmSharedStoreTransformer< typename IgemmConfig::Accumulators::Element, SharedStoreFragmentD >::Transformer | SharedStoreTransformerD |
| The transformer from accumulators to shared memory fragments. More...
|
|
typedef Base::SharedLoadTileTraits | SharedLoadTileTraits |
| The traits class for the shared iterator to load D from shared memory. More...
|
|
typedef TileLoadIterator< SharedLoadTileTraits, typename SharedLoadTileTraits::Scalar, IteratorAdvance::kH, MemorySpace::kShared > | SharedLoadIteratorD |
| The shared iterator to load D from shared memory. More...
|
|
typedef EpilogueFunctor_::Scalar | Scalar |
| The scalar. More...
|
|
typedef IgemmConfig_ ::OutputTile | OutputTile |
| The output tile. More...
|
|
typedef Shape< 1, IgemmConfig_ ::MultiplyAdd::AccumulatorsPerThread::kH/IgemmConfig_ ::kAccumulatorsPerLdsB, IgemmConfig_ ::kAccumulatorsPerLdsB > | Iterations |
| The number of iterations in the epilogue. More...
|
|
typedef Shape< 0, IgemmConfig_ ::kAccumulatorsPerLdsB *(IgemmConfig_ ::Warps::kH *IgemmConfig_ ::MultiplyAdd::ThreadsPerWarp::kH - 1), 0 > | Delta |
|
typedef EpilogueFunctor_ | Functor |
| The functor to do the math in the epilogue. More...
|
|
typedef GemmSharedStoreTileDTraits< typename Functor::ScalarAccum, typename IgemmConfig_ ::OutputTile, typename IgemmConfig_ ::Warps, typename IgemmConfig_ ::MultiplyAdd::ThreadsPerWarp, IgemmConfig_ ::kScalarsPerStsD, 128/sizeof(typename IgemmConfig_ ::ScalarD)/IgemmConfig_ ::kScalarsPerStsD/2 *IgemmConfig_ ::kScalarsPerStsD > | SharedStoreTileTraits |
| The traits class to build the iterator to store to shared memory for D. More...
|
|
typedef TileStoreIterator< SharedStoreTileTraits, typename SharedStoreTileTraits::Scalar, IteratorAdvance::kH, MemorySpace::kShared > | SharedStoreIteratorD |
| The iterator to store D to shared memory. More...
|
|
typedef Copy< typename SharedStoreIteratorD::Fragment > | SharedStoreTransformerD |
| The shared store transformer for D. More...
|
|
typedef GemmSharedLoadTileDTraits< typename Functor::ScalarAccum, typename IgemmConfig_ ::OutputTile, typename IgemmConfig_ ::Warps, typename IgemmConfig_ ::MultiplyAdd::ThreadsPerWarp, IgemmConfig_ ::OutputTile::kH/ShapeCount< Iterations >::kCount, IgemmConfig_ ::kScalarsPerLdsD, SharedStoreTileTraits::kSkew > | SharedLoadTileTraits |
| The traits class to build the iterator to load from shared memory for D. More...
|
|
typedef TileLoadIterator< SharedLoadTileTraits, typename SharedLoadTileTraits::Scalar, IteratorAdvance::kH, MemorySpace::kShared > | SharedLoadIteratorD |
| The iterator to load D from shared memory. More...
|
|
typedef SharedLoadStream< SharedLoadIteratorD > | SharedLoadStreamD |
| The stream to load D. More...
|
|
typedef GemmGlobalTileCdTraits< typename IgemmConfig_ ::ScalarC const, Shape< 1, IgemmConfig_ ::OutputTile::kH/ShapeCount< Iterations >::kCount, IgemmConfig_ ::OutputTile::kW >, Shape< 1, ShapeCount< typename IgemmConfig_ ::Warps >::kCount, IgemmConfig_ ::kWarpSize >, Iterations::kW, IgemmConfig_ ::kScalarsPerLdgC > | GlobalLoadTileTraits |
| The traits class to build the iterator to load data from global memory for C^N. More...
|
|
typedef GemmGlobalIteratorCd< GlobalLoadTileTraits, Index_ > | GlobalLoadIteratorC |
| The iterator to load C. More...
|
|
typedef Copy< typename GlobalLoadIteratorC::Fragment > | GlobalTransformerC |
| The transformer for C. More...
|
|
typedef GemmGlobalTileCdTraits< typename IgemmConfig_ ::ScalarD, Shape< 1, IgemmConfig_ ::OutputTile::kH/ShapeCount< Iterations >::kCount, IgemmConfig_ ::OutputTile::kW >, Shape< 1, ShapeCount< typename IgemmConfig_ ::Warps >::kCount, IgemmConfig_ ::kWarpSize >, Iterations::kW, IgemmConfig_ ::kScalarsPerStgD > | GlobalStoreTileTraits |
| The traits class to build the iterator to store data to global memory for D^N. More...
|
|
typedef GemmGlobalIteratorCd< GlobalStoreTileTraits, Index_ > | GlobalStoreIteratorD |
| The iterator to store D. More...
|
|
typedef Copy< typename GlobalStoreIteratorD::Fragment > | GlobalTransformerD |
| The transformer for D. More...
|
|