| advanceAux(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
| advanceBlockDim(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
| advanceGridDim(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| advanceSharedBytes(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
| advanceTuneParam(TuneParam &param) const | quda::Tunable | inlinevirtual |
| apply(const cudaStream_t &stream) | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| arg | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| aux | quda::Tunable | protected |
| blockMin() const | quda::Tunable | inlineprotectedvirtual |
| blockStep() const | quda::Tunable | inlineprotectedvirtual |
| bytes() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| checkLaunchParam(TuneParam &param) | quda::Tunable | inline |
| defaultTuneParam(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| flops() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| gridStep() const | quda::Tunable | inlineprotectedvirtual |
| initTuneParam(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| jitify_error | quda::Tunable | protected |
| jitifyError() const | quda::Tunable | inline |
| jitifyError() | quda::Tunable | inline |
| maxBlockSize(const TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
| maxBlocksPerSM() const | quda::Tunable | inlineprotected |
| maxDynamicSharedBytesPerBlock() const | quda::Tunable | inlineprotected |
| maxGridSize() const | quda::Tunable | inlineprotectedvirtual |
| maxSharedBytesPerBlock() const | quda::Tunable | inlineprotectedvirtual |
| minGridSize() const | quda::Tunable | inlineprotectedvirtual |
| minThreads() const | quda::Tunable | inlineprotectedvirtual |
| MultiReduceCuda(doubleN result[], SpinorX X[], SpinorY Y[], SpinorZ Z[], SpinorW W[], Reducer &r, std::vector< ColorSpinorField *> &x, std::vector< ColorSpinorField *> &y, std::vector< ColorSpinorField *> &z, std::vector< ColorSpinorField *> &w, int NYW, int length) | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inline |
| nParity | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| NYW | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| paramString(const TuneParam &param) const | quda::Tunable | inlinevirtual |
| perfString(float time) const | quda::Tunable | inlinevirtual |
| postTune() | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| preTune() | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| resetBlockDim(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
| result | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| setMaxDynamicSharedBytesPerBlock(F *func) const | quda::Tunable | inlineprotected |
| sharedBytesPerBlock(const TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
| sharedBytesPerThread() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
| Tunable() | quda::Tunable | inline |
| tuneAuxDim() const | quda::Tunable | inlineprotectedvirtual |
| tuneGridDim() const | quda::Tunable | inlineprotectedvirtual |
| tuneKey() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| tuneSharedBytes() const | quda::Tunable | inlineprotectedvirtual |
| tuningIter() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
| w | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| W_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| Wnorm_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| writeAuxString(const char *format,...) | quda::Tunable | inlineprotected |
| x | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| y | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| Y_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| Ynorm_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| z | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
| ~Tunable() | quda::Tunable | inlinevirtual |