Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
List of all members
cutlass::gemm::HgemmTraits< kLayoutA_, kLayoutB_, OutputTile_, EpilogueFunctor_, ThreadGemmShape_, kScalarsPerLdgA_, kScalarsPerLdgB_, Index_, Helper_ > Struct Template Reference

#include <hgemm_traits.h>

Inheritance diagram for cutlass::gemm::HgemmTraits< kLayoutA_, kLayoutB_, OutputTile_, EpilogueFunctor_, ThreadGemmShape_, kScalarsPerLdgA_, kScalarsPerLdgB_, Index_, Helper_ >:
cutlass::gemm::GemmTraits< Helper_::GemmConfig, Helper_::GlobalLoadStreamA, Helper_::GlobalLoadStreamB, Helper_::SharedLoadStreamA, Helper_::SharedLoadStreamB, Helper_::Epilogue, IdentityBlockSwizzle, Index_, Helper_::ClearAccumulators >

Additional Inherited Members

- Public Types inherited from cutlass::gemm::GemmTraits< Helper_::GemmConfig, Helper_::GlobalLoadStreamA, Helper_::GlobalLoadStreamB, Helper_::SharedLoadStreamA, Helper_::SharedLoadStreamB, Helper_::Epilogue, IdentityBlockSwizzle, Index_, Helper_::ClearAccumulators >
typedef GemmTraits< Helper_::GemmConfig, Helper_::GlobalLoadStreamA, Helper_::GlobalLoadStreamB, Helper_::SharedLoadStreamA, Helper_::SharedLoadStreamB, Helper_::Epilogue, IdentityBlockSwizzle, Index_, Helper_::ClearAccumulators > This_
 This traits class. More...
 
typedef cutlass::gemm::Gemm< This_ > KernelClass
 The struct that consumes this Traits. More...
 
typedef Helper_::GemmConfig GemmConfig
 The configuration. More...
 
typedef GemmConfig::OutputTile OutputTile
 The output tile. More...
 
typedef Helper_::GlobalLoadStreamA GlobalLoadStreamA
 The stream to load A from global memory to shared memory. More...
 
typedef Helper_::GlobalLoadStreamA::Scalar ScalarA
 The scalar for A. More...
 
typedef Helper_::GlobalLoadStreamB GlobalLoadStreamB
 The stream to load B from global memory to shared memory. More...
 
typedef Helper_::GlobalLoadStreamB::Scalar ScalarB
 The scalar for B. More...
 
typedef Helper_::SharedLoadStreamA SharedLoadStreamA
 The iterator for A to load from shared memory. More...
 
typedef Helper_::SharedLoadStreamB SharedLoadStreamB
 The iterator for B to load from shared memory. More...
 
typedef GemmConfig::MultiplyAdd MultiplyAdd
 The multiply-add functor. More...
 
typedef Helper_::Epilogue Epilogue
 The epilogue. More...
 
typedef Epilogue::ScalarC ScalarC
 The scalars in the epilogue. More...
 
typedef Epilogue::ScalarD ScalarD
 
typedef IdentityBlockSwizzle BlockSwizzle
 The block swizzle to reorganize the grid. More...
 
typedef Index_ Index
 The index. More...
 
typedef Helper_::ClearAccumulators ClearAccumulators
 Clear the accumulators. More...
 
typedef GlobalLoadStreamPair< GlobalLoadStreamA, GlobalLoadStreamB, GemmConfig::kResidueInProlog > GlobalLoadStream
 Assemble the global load streams for A/B. More...
 
typedef GlobalLoadStream::ThreadblockTileStorage ThreadblockTileStorage
 Memory needed to store the threadblock-scoped GEMM tile. More...
 
typedef SharedStreamPair< SharedLoadStreamA, SharedLoadStreamB > SharedStream
 Assemble the shared load streams for A/B. More...
 
- Static Public Member Functions inherited from cutlass::gemm::GemmTraits< Helper_::GemmConfig, Helper_::GlobalLoadStreamA, Helper_::GlobalLoadStreamB, Helper_::SharedLoadStreamA, Helper_::SharedLoadStreamB, Helper_::Epilogue, IdentityBlockSwizzle, Index_, Helper_::ClearAccumulators >
static CUTLASS_DEVICE void shared_load_fence (bool in_loop)
 The memory fence for shared loads. More...
 
static CUTLASS_DEVICE void shared_store_fence (bool in_loop)
 The memory fence for shared stores. More...
 
- Static Public Attributes inherited from cutlass::gemm::GemmTraits< Helper_::GemmConfig, Helper_::GlobalLoadStreamA, Helper_::GlobalLoadStreamB, Helper_::SharedLoadStreamA, Helper_::SharedLoadStreamB, Helper_::Epilogue, IdentityBlockSwizzle, Index_, Helper_::ClearAccumulators >
static MatrixLayout::Kind const kLayoutA
 The layout of A. More...
 
static MatrixLayout::Kind const kLayoutB
 The layout of B. More...
 

The documentation for this struct was generated from the following file: