|
Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
|
#include <igemm_swizzle.h>
Public Types | |
| typedef GlobalIterator_ | GlobalIterator |
| The global iterator. More... | |
| typedef GlobalIterator::Fragment | Fragment |
| The source fragment. More... | |
| typedef GlobalIterator::FragmentShape | FragmentShape |
| The shape of the source fragment. More... | |
| typedef Fragment | InputFragment |
| The source fragment. More... | |
| typedef Fragment | OutputFragment |
| The destination fragment. More... | |
Public Member Functions | |
| CUTLASS_DEVICE | IgemmSwizzle () |
| Constructor. The source and destination must be int8 fragments. More... | |
| CUTLASS_DEVICE void | transform (Fragment const &src, Fragment &dst) |
| Transform a fragment. More... | |
| typedef GlobalIterator::Fragment cutlass::gemm::IgemmSwizzle< GlobalIterator_ >::Fragment |
| typedef GlobalIterator::FragmentShape cutlass::gemm::IgemmSwizzle< GlobalIterator_ >::FragmentShape |
| typedef GlobalIterator_ cutlass::gemm::IgemmSwizzle< GlobalIterator_ >::GlobalIterator |
| typedef Fragment cutlass::gemm::IgemmSwizzle< GlobalIterator_ >::InputFragment |
| typedef Fragment cutlass::gemm::IgemmSwizzle< GlobalIterator_ >::OutputFragment |
|
inline |
Constructor. The number of elements must be a multiple of 4.
|
inline |
1.8.14