Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
|
#include <igemm_global_tile.h>
Classes | |
struct | ThreadOffset |
Computes the thread offset in (H, W) based on thread ID. More... | |
Public Types | |
typedef GemmGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ > | Base |
The base class. More... | |
typedef Base::Threads | Threads |
The threads. More... | |
typedef Shape< Base::Threads::kH *4, 1, Base::Threads::kW, Base::kAccessSize > | Delta |
The strides in each dimension between different loads/stores. More... | |
typedef Shape< Base::Tile::kH/Base::Threads::kH/4, 4, Base::Tile::kW/Base::Threads::kW, Base::Tile::kC/Base::kAccessSize > | Iterations |
The number of iterations needed to load/store the tile. More... | |
typedef Shape< 1, 4, Base::Tile::kC > | ThreadsDelta |
The threads strides. More... | |
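Public Types inherited from cutlass::gemm::GemmGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ > | |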
typedef platform::remove_const< Scalar_ >::type | Scalar |
The scalar. More... | |
typedef Scalar_ * | Pointer |
The pointer. More... | |
typedef ReshapeTile< Tile_, kAccessSize_ >::Tile | Tile |
The tile shape. More... | |
typedef ReshapeThreads< Tile, Threads_ >::Threads | Threads |
The threads shape. More... | |
typedef Shape< 1, 1, Tile::kC > | ThreadsDelta |
The relative offset between two elements in the H/W dimension in adjacent threads. More... | |
typedef Shape< 0, Threads::kH, Threads::kW *kAccessSize > | Delta |
The strides in each dimension between different loads/stores. More... | |
typedef Shape< 0, 0, Threads::kW *ThreadsDelta::kW, kAccessSize > | ImmediateOffsetStrides |
Strides for immediate offset computation. More... | |
typedef Shape< 1, Tile::kH/Threads::kH, Tile::kW/Threads::kW, Tile::kC/kAccessSize > | Iterations |
The number of iterations needed to load/store the tile. More... | |
typedef GemmMultiplicandTraits< Tile, kOperand, kLayout > | MultiplicandTraits |
Additional Inherited Members | |
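Static Public Attributes inherited from cutlass::gemm::GemmGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ > | |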
static GemmOperand::Kind const | kOperand = kOperand_ |
Identity of the operand. More... | |
static MatrixLayout::Kind const | kLayout = kLayout_ |
The layout. More... | |
static int const | kAccessSize = kAccessSize_ |
The number of scalars per LDG/STG. More... | |
static MemorySpace::Kind const | kMemorySpace = MemorySpace::kGlobal |
The memory space. More... | |
typedef GemmGlobalTileTraits<kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_> cutlass::gemm::IgemmContiguousGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ >::Base |
typedef Shape<Base::Threads::kH * 4, 1, Base::Threads::kW, Base::kAccessSize> cutlass::gemm::IgemmContiguousGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ >::Delta |
typedef Shape<Base::Tile::kH / Base::Threads::kH / 4, 4, Base::Tile::kW / Base::Threads::kW, Base::Tile::kC / Base::kAccessSize> cutlass::gemm::IgemmContiguousGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ >::Iterations |
typedef Base::Threads cutlass::gemm::IgemmContiguousGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ >::Threads |
typedef Shape<1, 4, Base::Tile::kC> cutlass::gemm::IgemmContiguousGlobalTileTraits< kOperand_, kLayout_, Scalar_, Tile_, Threads_, kAccessSize_ >::ThreadsDelta |