Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
|
#include <tile_traits_standard.h>
Public Types | |
typedef Tile_ | Tile |
Shape of tile. More... | |
typedef Shape< 1, 1, kThreads > | ThreadShape |
Thread shape. More... | |
typedef Shape< 1, 1, kThreads > | Delta |
Delta between each thread's accesses. More... | |
typedef Shape< 1, Tile::kH, Tile::kW/kThreads > | Iterations |
Number of iterations. More... | |
typedef TiledThreadOffset< ThreadShape > | ThreadOffset |
Computes the initial offset. More... | |
Static Public Attributes | |
static int const | kThreads = Threads |
Number of participating threads. More... | |
Tiling in which there are fewer threads than tile elements in the contiguous dimension. Accordingly, Iterations is Shape<1, Tile::kH, Tile::kW / kThreads>.
typedef Shape<1, 1, kThreads> cutlass::TileTraitsContiguousMajor< Tile_, Threads >::Delta |
typedef Shape<1, Tile::kH, Tile::kW / kThreads> cutlass::TileTraitsContiguousMajor< Tile_, Threads >::Iterations |
typedef TiledThreadOffset<ThreadShape> cutlass::TileTraitsContiguousMajor< Tile_, Threads >::ThreadOffset |
typedef Shape<1, 1, kThreads> cutlass::TileTraitsContiguousMajor< Tile_, Threads >::ThreadShape |
typedef Tile_ cutlass::TileTraitsContiguousMajor< Tile_, Threads >::Tile |
|
static |