QUDA 1.0.0
#include <quda_constants.h>
#include <float_vector.h>
#include <comm_quda.h>
#include <blas_quda.h>
#include <cub/block/block_reduce.cuh>
Go to the source code of this file.
Classes | |
struct | quda::vector_type< scalar, n > |
struct | quda::ReduceArg< T > |
struct | quda::reduce_vector< T > |
Namespaces | |
quda | |
Functions | |
template<typename scalar , int n> | |
__device__ __host__ void | quda::zero (vector_type< scalar, n > &v) |
template<typename scalar , int n> | |
__device__ __host__ vector_type< scalar, n > | quda::operator+ (const vector_type< scalar, n > &a, const vector_type< scalar, n > &b) |
template<int block_size_x, int block_size_y, typename T , bool do_sum = true, typename Reducer = cub::Sum> | |
__device__ void | quda::reduce2d (ReduceArg< T > arg, const T &in, const int idx=0) |
template<int block_size, typename T , bool do_sum = true, typename Reducer = cub::Sum> | |
__device__ void | quda::reduce (ReduceArg< T > arg, const T &in, const int idx=0) |
template<int block_size_x, int block_size_y, typename T > | |
__device__ void | quda::reduceRow (ReduceArg< T > arg, const T &in) |
Variables | |
__device__ unsigned int | quda::count [QUDA_MAX_MULTI_REDUCE] = { } |
__shared__ bool | quda::isLastBlockDone |
__shared__ volatile bool | quda::isLastWarpDone [16] |
Provides helper functors for using custom data types with CUB algorithms.
Definition in file cub_helper.cuh.