Cutlass
CUDA Templates for Linear Algebra Subroutines and Solvers
Defines a 1D vector of elements held in the registers of each thread.
Go to the source code of this file.
Namespaces | |
cutlass | |
Functions | |
template<> struct __align__(1) cutlass::AlignedStruct< 1 >
template<> struct __align__(2) cutlass::AlignedStruct< 2 >
template<> struct __align__(4) cutlass::AlignedStruct< 4 >
template<> struct __align__(8) cutlass::AlignedStruct< 8 >
template<> struct __align__(16) cutlass::AlignedStruct< 16 >
template<> struct __align__(32) cutlass::AlignedStruct< 32 >
template<> struct __align__(64) cutlass::AlignedStruct< 64 >
template<typename Scalar_> CUTLASS_HOST_DEVICE void cutlass::make_zero (Scalar_ &x)
template<typename Scalar_, int kLanes_> CUTLASS_HOST_DEVICE void cutlass::make_zero (Vector< Scalar_, kLanes_ > &vec)