Template performing a matrix multiply-add operation within a thread.
#include <thread_multiply_add.h>
◆ Accumulators
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ AccumulatorsPerThread
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ AccumulatorsPerWarp
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ FragmentA
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ FragmentB
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ InstructionShape
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ScalarA
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ScalarB
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ScalarC
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ThreadGemmShape
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ThreadsPerWarp
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ ThreadMultiplyAdd()
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
◆ multiply_add()
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor>
The documentation for this struct was generated from the following file: