QUDA
1.0.0
|
Public Member Functions | |
__device__ __host__ | Gamma () |
__device__ __host__ | Gamma (const Gamma &g) |
__device__ __host__ int | getcol (int row) const |
__device__ __host__ complex< ValueType > | getelem (int row) const |
__device__ __host__ complex< ValueType > | getelem (int row, int col) const |
__device__ __host__ complex< ValueType > | getrowelem (int row, int &col) const |
__device__ __host__ complex< ValueType > | apply (int row, const complex< ValueType > &a) const |
constexpr int | Dir () const |
Gamma (Arg &arg, const ColorSpinorField &meta) | |
virtual | ~Gamma () |
void | apply (const cudaStream_t &stream) |
TuneKey | tuneKey () const |
void | preTune () |
void | postTune () |
![]() | |
TunableVectorY (unsigned int vector_length_y) | |
bool | advanceBlockDim (TuneParam &param) const |
void | initTuneParam (TuneParam &param) const |
void | defaultTuneParam (TuneParam &param) const |
void | resizeVector (int y) const |
void | resizeStep (int y) const |
![]() | |
Tunable () | |
virtual | ~Tunable () |
virtual int | tuningIter () const |
virtual std::string | paramString (const TuneParam &param) const |
virtual std::string | perfString (float time) const |
virtual bool | advanceTuneParam (TuneParam &param) const |
void | checkLaunchParam (TuneParam &param) |
CUresult | jitifyError () const |
CUresult & | jitifyError () |
Protected Member Functions | |
long long | flops () const |
long long | bytes () const |
bool | tuneGridDim () const |
unsigned int | minThreads () const |
![]() | |
virtual unsigned int | sharedBytesPerThread () const |
virtual unsigned int | sharedBytesPerBlock (const TuneParam &param) const |
![]() | |
virtual bool | tuneAuxDim () const |
virtual bool | tuneSharedBytes () const |
virtual bool | advanceGridDim (TuneParam &param) const |
virtual unsigned int | maxBlockSize (const TuneParam &param) const |
virtual unsigned int | maxGridSize () const |
virtual unsigned int | minGridSize () const |
virtual int | gridStep () const |
gridStep sets the step size when iterating the grid size in advanceGridDim. More... | |
virtual int | blockStep () const |
virtual int | blockMin () const |
virtual void | resetBlockDim (TuneParam &param) const |
unsigned int | maxBlocksPerSM () const |
For some reason this can't be queried from the device properties, so here we set this. Based on Table 14 of the CUDA Programming Guide 10.0 (Technical Specifications per Compute Capability). More... | |
template<typename F > | |
void | setMaxDynamicSharedBytesPerBlock (F *func) const |
Enable the maximum dynamic shared bytes for the kernel "func" (values given by maxDynamicSharedBytesPerBlock()). More... | |
unsigned int | maxDynamicSharedBytesPerBlock () const |
This can't be correctly queried in CUDA for all architectures, so here we set this. Based on Table 14 of the CUDA Programming Guide 10.0 (Technical Specifications per Compute Capability). More... | |
virtual unsigned int | maxSharedBytesPerBlock () const |
The maximum shared memory that a CUDA thread block can use in the autotuner. This isn't necessarily the same as maxDynamicSharedBytesPerBlock() since that may need an explicit opt-in to enable (by calling setMaxDynamicSharedBytesPerBlock() for the kernel in question). If the CUDA kernel in question does this opt-in then this function can be overridden to return maxDynamicSharedBytesPerBlock(). More... | |
virtual bool | advanceSharedBytes (TuneParam &param) const |
virtual bool | advanceAux (TuneParam &param) const |
int | writeAuxString (const char *format,...) |
Protected Attributes | |
Arg & | arg |
const ColorSpinorField & | meta |
![]() | |
unsigned int | vector_length_y |
unsigned int | step_y |
bool | tune_block_x |
![]() | |
char | aux [TuneKey::aux_n] |
CUresult | jitify_error |
Static Private Attributes | |
static constexpr int | ndim = 4 |
|
inline |
|
inline |
|
inline |
Definition at line 266 of file dslash_quda.cu.
References quda::LatticeField::AuxString().
|
inlinevirtual |
Definition at line 270 of file dslash_quda.cu.
|
inline |
Definition at line 221 of file gamma.cuh.
References QUDA_DEGRAND_ROSSI_GAMMA_BASIS, and QUDA_UKQCD_GAMMA_BASIS.
Referenced by quda::ApplyGamma(), and quda::multiplyVUV().
|
inlinevirtual |
Implements quda::Tunable.
Definition at line 272 of file dslash_quda.cu.
References quda::arg(), quda::TuneParam::block, errorQuda, getTuning(), getVerbosity(), quda::TuneParam::grid, quda::LatticeField::Location(), QUDA_CPU_FIELD_LOCATION, quda::TuneParam::shared_bytes, and quda::tuneLaunch().
|
inlineprotectedvirtual |
Reimplemented from quda::Tunable.
Definition at line 261 of file dslash_quda.cu.
|
inline |
|
inlineprotectedvirtual |
Implements quda::Tunable.
Definition at line 260 of file dslash_quda.cu.
|
inline |
Definition at line 28 of file gamma.cuh.
References QUDA_DEGRAND_ROSSI_GAMMA_BASIS.
Referenced by quda::Gamma< ValueType, basis, dir >::getelem(), quda::Gamma< ValueType, basis, dir >::getrowelem(), and quda::multiplyVUV().
|
inline |
Definition at line 98 of file gamma.cuh.
References QUDA_DEGRAND_ROSSI_GAMMA_BASIS, and QUDA_UKQCD_GAMMA_BASIS.
Referenced by quda::Gamma< ValueType, basis, dir >::getelem(), and quda::Gamma< ValueType, basis, dir >::getrowelem().
|
inline |
Definition at line 209 of file gamma.cuh.
References quda::Gamma< ValueType, basis, dir >::getcol(), and quda::Gamma< ValueType, basis, dir >::getelem().
|
inline |
Definition at line 215 of file gamma.cuh.
References quda::Gamma< ValueType, basis, dir >::getcol(), and quda::Gamma< ValueType, basis, dir >::getelem().
|
inlineprotectedvirtual |
Reimplemented from quda::Tunable.
Definition at line 263 of file dslash_quda.cu.
References quda::Arg< real, Ns, Nc, order >::volumeCB.
|
inlinevirtual |
Reimplemented from quda::Tunable.
Definition at line 287 of file dslash_quda.cu.
|
inlinevirtual |
Reimplemented from quda::Tunable.
Definition at line 286 of file dslash_quda.cu.
|
inlineprotectedvirtual |
Reimplemented from quda::Tunable.
Definition at line 262 of file dslash_quda.cu.
|
inlinevirtual |
Implements quda::Tunable.
Definition at line 284 of file dslash_quda.cu.
References quda::LatticeField::VolString().
|
protected |
Definition at line 257 of file dslash_quda.cu.
|
protected |
Definition at line 258 of file dslash_quda.cu.
|
staticprivate |