#include <gemm.h>
|
CUTLASS_DEVICE | Gemm (Params const &params_, SharedStorage &shared_storage_) |
| Ctor. More...
|
|
template<bool Residue, bool LastIteration> |
CUTLASS_DEVICE void | consume_tile (typename Traits::GlobalLoadStream &global_to_shared_stream, typename Traits::SharedStream &shared_load_stream, typename MultiplyAdd::Accumulators &accumulators, Index outer_k) |
| Computes a warp-level GEMM on data held in shared memory. More...
|
|
CUTLASS_DEVICE void | multiply_add () |
| Do the GEMM. More...
|
|
◆ Index
template<typename GemmTraits_ >
◆ MultiplyAdd
template<typename GemmTraits_ >
◆ Params
template<typename GemmTraits_ >
◆ ScalarA
template<typename GemmTraits_ >
◆ ScalarB
template<typename GemmTraits_ >
◆ ScalarC
template<typename GemmTraits_ >
◆ ScalarD
template<typename GemmTraits_ >
◆ ScalarEpilogue
template<typename GemmTraits_ >
◆ SharedStorage
template<typename GemmTraits_ >
◆ This_
template<typename GemmTraits_ >
◆ Traits
template<typename GemmTraits_ >
◆ Gemm()
template<typename GemmTraits_ >
◆ consume_tile()
template<typename GemmTraits_ >
template<bool Residue, bool LastIteration>
CUTLASS_DEVICE void cutlass::gemm::Gemm< GemmTraits_ >::consume_tile |
( |
typename Traits::GlobalLoadStream & |
global_to_shared_stream, |
|
|
typename Traits::SharedStream & |
shared_load_stream, |
|
|
typename MultiplyAdd::Accumulators & |
accumulators, |
|
|
Index |
outer_k |
|
) |
| |
|
inline |
◆ launch() [1/2]
template<typename GemmTraits_ >
static __host__ cudaError_t cutlass::gemm::Gemm< GemmTraits_ >::launch |
( |
Params const & |
params, |
|
|
cudaStream_t |
stream = cudaStreamDefault |
|
) |
| |
|
inline static |
◆ launch() [2/2]
template<typename GemmTraits_ >
static __host__ cudaError_t cutlass::gemm::Gemm< GemmTraits_ >::launch |
( |
CUfunction |
kernel, |
|
|
Params const & |
params, |
|
|
CUstream |
stream = CU_STREAM_LEGACY |
|
) |
| |
|
inline static |
◆ multiply_add()
template<typename GemmTraits_ >
◆ kThreads
template<typename GemmTraits_ >
◆ kWarpGemmSteps
template<typename GemmTraits_ >
Initial value:
= Traits::GemmConfig::AccumulatorsPerWarp::kD / MultiplyAdd::InstructionShape::kD
◆ params
template<typename GemmTraits_ >
◆ shared_storage
template<typename GemmTraits_ >
The documentation for this struct was generated from the following file: