advanceAux(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
advanceBlockDim(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
advanceGridDim(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
advanceSharedBytes(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
advanceTuneParam(TuneParam &param) const | quda::Tunable | inlinevirtual |
apply(const cudaStream_t &stream) | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
arg | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
aux | quda::Tunable | protected |
blockMin() const | quda::Tunable | inlineprotectedvirtual |
blockStep() const | quda::Tunable | inlineprotectedvirtual |
bytes() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
checkLaunchParam(TuneParam &param) | quda::Tunable | inline |
defaultTuneParam(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
flops() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
gridStep() const | quda::Tunable | inlineprotectedvirtual |
initTuneParam(TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
jitify_error | quda::Tunable | protected |
jitifyError() const | quda::Tunable | inline |
jitifyError() | quda::Tunable | inline |
maxBlockSize(const TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
maxBlocksPerSM() const | quda::Tunable | inlineprotected |
maxDynamicSharedBytesPerBlock() const | quda::Tunable | inlineprotected |
maxGridSize() const | quda::Tunable | inlineprotectedvirtual |
maxSharedBytesPerBlock() const | quda::Tunable | inlineprotectedvirtual |
minGridSize() const | quda::Tunable | inlineprotectedvirtual |
minThreads() const | quda::Tunable | inlineprotectedvirtual |
MultiReduceCuda(doubleN result[], SpinorX X[], SpinorY Y[], SpinorZ Z[], SpinorW W[], Reducer &r, std::vector< ColorSpinorField *> &x, std::vector< ColorSpinorField *> &y, std::vector< ColorSpinorField *> &z, std::vector< ColorSpinorField *> &w, int NYW, int length) | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inline |
nParity | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
NYW | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
paramString(const TuneParam &param) const | quda::Tunable | inlinevirtual |
perfString(float time) const | quda::Tunable | inlinevirtual |
postTune() | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
preTune() | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
resetBlockDim(TuneParam &param) const | quda::Tunable | inlineprotectedvirtual |
result | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
setMaxDynamicSharedBytesPerBlock(F *func) const | quda::Tunable | inlineprotected |
sharedBytesPerBlock(const TuneParam &param) const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
sharedBytesPerThread() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlineprivatevirtual |
Tunable() | quda::Tunable | inline |
tuneAuxDim() const | quda::Tunable | inlineprotectedvirtual |
tuneGridDim() const | quda::Tunable | inlineprotectedvirtual |
tuneKey() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
tuneSharedBytes() const | quda::Tunable | inlineprotectedvirtual |
tuningIter() const | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | inlinevirtual |
w | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
W_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
Wnorm_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
writeAuxString(const char *format,...) | quda::Tunable | inlineprotected |
x | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
y | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
Y_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
Ynorm_h | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
z | quda::blas::MultiReduceCuda< NXZ, doubleN, ReduceType, FloatN, M, SpinorX, SpinorY, SpinorZ, SpinorW, Reducer > | private |
~Tunable() | quda::Tunable | inlinevirtual |