QUDA v0.4.0
A library for QCD on GPUs
|
#include <reduce_core.h>
Public Member Functions
ReduceCuda (doubleN &result, InputX &X, InputY &Y, InputZ &Z, InputW &W, InputV &V, Reducer &r, OutputX &XX, OutputY &YY, OutputZ &ZZ, int length)
virtual ~ReduceCuda ()
TuneKey tuneKey () const
void apply (const cudaStream_t &stream)
void preTune ()
void postTune ()
long long flops () const
long long bytes () const
Definition at line 356 of file reduce_core.h.
ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::ReduceCuda (doubleN &result, InputX &X, InputY &Y, InputZ &Z, InputW &W, InputV &V, Reducer &r, OutputX &XX, OutputY &YY, OutputZ &ZZ, int length) [inline]
Definition at line 396 of file reduce_core.h.
virtual ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::~ReduceCuda () [inline, virtual]
Definition at line 400 of file reduce_core.h.
void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::apply (const cudaStream_t &stream) [inline, virtual]
Implements Tunable.
Definition at line 412 of file reduce_core.h.
long long ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::bytes () const [inline, virtual]
Reimplemented from Tunable.
Definition at line 435 of file reduce_core.h.
long long ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::flops () const [inline, virtual]
Reimplemented from Tunable.
Definition at line 434 of file reduce_core.h.
void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::postTune () [inline, virtual]
Reimplemented from Tunable.
Definition at line 426 of file reduce_core.h.
void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::preTune () [inline, virtual]
Reimplemented from Tunable.
Definition at line 418 of file reduce_core.h.
TuneKey ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::tuneKey () const [inline, virtual]
Implements Tunable.
Definition at line 402 of file reduce_core.h.