template<typename FloatN, int M, typename SpinorX, typename SpinorY, typename SpinorZ, typename SpinorW, typename Functor>
class BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >
Definition at line 49 of file blas_core.cuh.
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
virtual bool BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::advanceSharedBytes(TuneParam &param) const
inline private virtual
Definition at line 66 of file blas_core.cuh.
References param, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::sharedBytesPerBlock(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::sharedBytesPerThread().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
void BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::apply(const cudaStream_t &stream)
inline
Definition at line 88 of file blas_core.cuh.
References BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg, getTuning(), getVerbosity(), stream, and quda::tuneLaunch().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
long long BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes() const
inline
Definition at line 118 of file blas_core.cuh.
References BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::nParity, QUDA_HALF_PRECISION, and value.
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
void BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::defaultTuneParam(TuneParam &param) const
inline
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
long long BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::flops() const
inline
Definition at line 117 of file blas_core.cuh.
References BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::nParity, and value.
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
void BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::initTuneParam(TuneParam &param) const
inline
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
void BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune()
inline
Definition at line 100 of file blas_core.cuh.
References BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes_, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::norm_bytes_, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::W_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Wnorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::X_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Xnorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Y_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Ynorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Z_h, and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Znorm_h.
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
void BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune()
inline
Definition at line 93 of file blas_core.cuh.
References BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes_, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::norm_bytes_, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::W_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Wnorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::X_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Xnorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Y_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Ynorm_h, BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Z_h, and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Znorm_h.
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
unsigned int BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::sharedBytesPerBlock(const TuneParam &param) const
inline private
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
unsigned int BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::sharedBytesPerThread() const
inline private
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
TuneKey BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::tuneKey() const
inline
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
BlasArg<SpinorX,SpinorY,SpinorZ,SpinorW,Functor> BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::arg
mutable private
Definition at line 52 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::apply(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::flops(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::tuneKey().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| const size_t* BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes_ |
|
private |
Definition at line 60 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| const size_t* BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::norm_bytes_ |
|
private |
Definition at line 61 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| const int BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::nParity |
|
private |
Definition at line 54 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::bytes(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::defaultTuneParam(), BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::flops(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::initTuneParam().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::W_h |
|
private |
Definition at line 58 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Wnorm_h |
|
private |
Definition at line 59 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char* BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::X_h |
|
private |
Definition at line 58 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char* BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Xnorm_h |
|
private |
Definition at line 59 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Y_h |
|
private |
Definition at line 58 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Ynorm_h |
|
private |
Definition at line 59 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Z_h |
|
private |
Definition at line 58 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().
template<typename FloatN , int M, typename SpinorX , typename SpinorY , typename SpinorZ , typename SpinorW , typename Functor >
| char * BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::Znorm_h |
|
private |
Definition at line 59 of file blas_core.cuh.
Referenced by BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::postTune(), and BlasCuda< FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Functor >::preTune().