Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
Classes | Namespaces
igemm_epilogue.h File Reference

Defines the epilogue phase of the GEMM computation for IGEMM, supporting integer and floating-point output matrix formats.

#include "cutlass/convert.h"
#include "cutlass/fragment.h"
#include "cutlass/gemm/gemm_global_stream.h"
#include "cutlass/gemm/gemm_shared_stream.h"
#include "cutlass/gemm/igemm_global_tile.h"
#include "cutlass/reshape_tile.h"
#include "cutlass/tile_iterator.h"

Go to the source code of this file.

Classes

struct  cutlass::gemm::IgemmFloatToInt8Converter< kElements_ >
 
struct  cutlass::gemm::IgemmGlobalStoreTransformer< InputScalar_, OutputFragment_ >
 
struct  cutlass::gemm::IgemmGlobalStoreTransformer< float, Fragment< int8_t, kElements_ > >
 
struct  cutlass::gemm::IgemmInt8ToFloatConverter< kElements_ >
 
struct  cutlass::gemm::IgemmGlobalLoadTransformer< InputFragment_, OutputScalar_ >
 
struct  cutlass::gemm::IgemmGlobalLoadTransformer< Fragment< int8_t, kElements_ >, float >
 
struct  cutlass::gemm::IgemmSharedStoreTransformer< InputScalar_, OutputFragment_ >
 
struct  cutlass::gemm::IgemmEpilogueTraitsHelper< IgemmConfig_, EpilogueFunctor_, Index_ >
 
struct  cutlass::gemm::IgemmEpilogueTraits< IgemmConfig_, EpilogueFunctor_, Index_, Helper_ >
 
struct  cutlass::gemm::IgemmEpilogue< GemmEpilogueTraits_, bool >
 
struct  cutlass::gemm::IgemmEpilogue< GemmEpilogueTraits_, true >
 

Namespaces

 cutlass
 
 cutlass::gemm