|
QUDA v0.4.0
A library for QCD on GPUs
|
#include <reduce_core.h>
Inheritance diagram for ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >:

Public Member Functions
| ReduceCuda (doubleN &result, InputX &X, InputY &Y, InputZ &Z, InputW &W, InputV &V, Reducer &r, OutputX &XX, OutputY &YY, OutputZ &ZZ, int length) | |
| virtual | ~ReduceCuda () |
| TuneKey | tuneKey () const |
| void | apply (const cudaStream_t &stream) |
| void | preTune () |
| void | postTune () |
| long long | flops () const |
| long long | bytes () const |
Definition at line 356 of file reduce_core.h.
| ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::ReduceCuda | ( | doubleN & result, InputX & X, InputY & Y, InputZ & Z, InputW & W, InputV & V, Reducer & r, OutputX & XX, OutputY & YY, OutputZ & ZZ, int length | ) | [inline] |
Definition at line 396 of file reduce_core.h.
| virtual ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::~ReduceCuda | ( | ) | [inline, virtual] |
Definition at line 400 of file reduce_core.h.
| void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::apply | ( | const cudaStream_t & | stream | ) | [inline, virtual] |
Implements Tunable.
Definition at line 412 of file reduce_core.h.
| long long ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::bytes | ( | ) | const [inline, virtual] |
Reimplemented from Tunable.
Definition at line 435 of file reduce_core.h.
| long long ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::flops | ( | ) | const [inline, virtual] |
Reimplemented from Tunable.
Definition at line 434 of file reduce_core.h.
| void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::postTune | ( | ) | [inline, virtual] |
Reimplemented from Tunable.
Definition at line 426 of file reduce_core.h.
| void ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::preTune | ( | ) | [inline, virtual] |
Reimplemented from Tunable.
Definition at line 418 of file reduce_core.h.
| TuneKey ReduceCuda< doubleN, ReduceType, ReduceSimpleType, FloatN, M, writeX, writeY, writeZ, InputX, InputY, InputZ, InputW, InputV, Reducer, OutputX, OutputY, OutputZ >::tuneKey | ( | ) | const [inline, virtual] |
Implements Tunable.
Definition at line 402 of file reduce_core.h.
1.7.4