|
QUDA v0.4.0
A library for QCD on GPUs
|
| advanceBlockDim(TuneParam &param) const | DslashCuda | [inline, protected, virtual] |
| advanceGridDim(TuneParam &param) const | DslashCuda | [inline, protected, virtual] |
| advanceSharedBytes(TuneParam &param) const | Tunable | [inline, protected, virtual] |
| advanceTuneParam(TuneParam &param) const | Tunable | [inline, virtual] |
| apply(const cudaStream_t &stream)=0 | Tunable | [pure virtual] |
| bytes() const | Tunable | [inline, protected, virtual] |
| defaultTuneParam(TuneParam &param) const | DslashCuda | [inline, virtual] |
| DslashCuda() | DslashCuda | [inline] |
| flops() const | Tunable | [inline, protected, virtual] |
| initTuneParam(TuneParam &param) const | DslashCuda | [inline, virtual] |
| Nface() | DslashCuda | [inline, virtual] |
| paramString(const TuneParam &param) const | DslashCuda | [inline, virtual] |
| perfString(float time) const | Tunable | [inline, virtual] |
| postTune() | Tunable | [inline, virtual] |
| preTune() | Tunable | [inline, virtual] |
| sharedBytesPerBlock() const | DslashCuda | [inline, protected, virtual] |
| sharedBytesPerThread() const =0 | Tunable | [protected, pure virtual] |
| SharedDslashCuda() | SharedDslashCuda | [inline] |
| Tunable() | Tunable | [inline] |
| tuneKey() const | DslashCuda | [virtual] |
| tuningIter() const | Tunable | [inline, virtual] |
| ~DslashCuda() | DslashCuda | [inline, virtual] |
| ~SharedDslashCuda() | SharedDslashCuda | [inline, virtual] |
| ~Tunable() | Tunable | [inline, virtual] |
1.7.4