QUDA v0.4.0
A library for QCD on GPUs
|
advanceBlockDim(TuneParam &param) const | DslashCuda | [inline, protected, virtual] |
advanceGridDim(TuneParam &param) const | DslashCuda | [inline, protected, virtual] |
advanceSharedBytes(TuneParam &param) const | Tunable | [inline, protected, virtual] |
advanceTuneParam(TuneParam &param) const | Tunable | [inline, virtual] |
apply(const cudaStream_t &stream) | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
DslashCuda::bytes() const | Tunable | [inline, protected, virtual] |
defaultTuneParam(TuneParam &param) const | DslashCuda | [inline, virtual] |
DslashCuda() | DslashCuda | [inline] |
flops() const | Tunable | [inline, protected, virtual] |
initTuneParam(TuneParam &param) const | DslashCuda | [inline, virtual] |
Nface() | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
paramString(const TuneParam &param) const | DslashCuda | [inline, virtual] |
perfString(float time) const | Tunable | [inline, virtual] |
postTune() | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
preTune() | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
sharedBytesPerBlock() const | DslashCuda | [inline, protected, virtual] |
sharedBytesPerThread() const | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, protected, virtual] |
StaggeredDslashCuda(sFloat *out, float *outNorm, const fatGFloat *fat0, const fatGFloat *fat1, const longGFloat *long0, const longGFloat *long1, const QudaReconstructType reconstruct, const sFloat *in, const float *inNorm, const sFloat *x, const float *xNorm, const double a, const int dagger, const size_t bytes, const size_t norm_bytes) | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline] |
Tunable() | Tunable | [inline] |
tuneKey() const | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
tuningIter() const | Tunable | [inline, virtual] |
~DslashCuda() | DslashCuda | [inline, virtual] |
~StaggeredDslashCuda() | StaggeredDslashCuda< sFloat, fatGFloat, longGFloat > | [inline, virtual] |
~Tunable() | Tunable | [inline, virtual] |