QUDA v0.4.0
A library for QCD on GPUs
|
#include <misc_helpers.h>
Go to the source code of this file.
Defines
#define gaugeSiteSize 18
#define BLOCKSIZE 64
#define READ_ST_STAPLE(staple, idx, mystride)
#define WRITE_ST_STAPLE(staple, idx, mystride)
Functions
template<int N, typename FloatN, typename Float2>
__global__ void do_link_format_cpu_to_gpu(FloatN *dst, Float2 *src, int reconstruct, int Vh, int pad, int ghostV, size_t threads)
template<int N, typename FloatN, typename Float2>
__global__ void do_link_format_cpu_to_gpu_milc(FloatN *dst, Float2 *src, int reconstruct, int Vh, int pad, int ghostV, size_t threads)
void link_format_cpu_to_gpu(void *dst, void *src, int reconstruct, int Vh, int pad, int ghostV, QudaPrecision prec, QudaGaugeFieldOrder cpu_order, cudaStream_t stream)
template<typename FloatN>
__global__ void do_link_format_gpu_to_cpu(FloatN *dst, FloatN *src, int Vh, int stride)
void link_format_gpu_to_cpu(void *dst, void *src, int Vh, int stride, QudaPrecision prec, cudaStream_t stream)
template<int dir, int whichway, typename Float2>
__global__ void collectGhostStapleKernel(Float2 *in, const int oddBit, Float2 *nbr_staple_gpu)
void collectGhostStaple(int *X, void *even, void *odd, int volume, QudaPrecision precision, void *ghost_staple_gpu, int dir, int whichway, cudaStream_t *stream)
#define BLOCKSIZE 64
Definition at line 4 of file misc_helpers.cu.
#define gaugeSiteSize 18
Definition at line 3 of file misc_helpers.cu.
#define READ_ST_STAPLE(staple, idx, mystride) \
    Float2 P0 = staple[idx + 0*mystride]; \
    Float2 P1 = staple[idx + 1*mystride]; \
    Float2 P2 = staple[idx + 2*mystride]; \
    Float2 P3 = staple[idx + 3*mystride]; \
    Float2 P4 = staple[idx + 4*mystride]; \
    Float2 P5 = staple[idx + 5*mystride]; \
    Float2 P6 = staple[idx + 6*mystride]; \
    Float2 P7 = staple[idx + 7*mystride]; \
    Float2 P8 = staple[idx + 8*mystride];
Definition at line 365 of file misc_helpers.cu.
#define WRITE_ST_STAPLE(staple, idx, mystride) \
    staple[idx + 0*mystride] = P0; \
    staple[idx + 1*mystride] = P1; \
    staple[idx + 2*mystride] = P2; \
    staple[idx + 3*mystride] = P3; \
    staple[idx + 4*mystride] = P4; \
    staple[idx + 5*mystride] = P5; \
    staple[idx + 6*mystride] = P6; \
    staple[idx + 7*mystride] = P7; \
    staple[idx + 8*mystride] = P8;
Definition at line 376 of file misc_helpers.cu.
void collectGhostStaple(int *X,
                        void *even,
                        void *odd,
                        int volume,
                        QudaPrecision precision,
                        void *ghost_staple_gpu,
                        int dir,
                        int whichway,
                        cudaStream_t *stream)
Definition at line 471 of file misc_helpers.cu.
template<int dir, int whichway, typename Float2>
__global__ void collectGhostStapleKernel(Float2 *in,
                                         const int oddBit,
                                         Float2 *nbr_staple_gpu)
Definition at line 391 of file misc_helpers.cu.
template<int N, typename FloatN, typename Float2>
__global__ void do_link_format_cpu_to_gpu(FloatN *dst,
                                          Float2 *src,
                                          int reconstruct,
                                          int Vh,
                                          int pad,
                                          int ghostV,
                                          size_t threads)
Definition at line 41 of file misc_helpers.cu.
template<int N, typename FloatN, typename Float2>
__global__ void do_link_format_cpu_to_gpu_milc(FloatN *dst,
                                               Float2 *src,
                                               int reconstruct,
                                               int Vh,
                                               int pad,
                                               int ghostV,
                                               size_t threads)
Definition at line 101 of file misc_helpers.cu.
template<typename FloatN>
__global__ void do_link_format_gpu_to_cpu(FloatN *dst,
                                          FloatN *src,
                                          int Vh,
                                          int stride)
Definition at line 319 of file misc_helpers.cu.
void link_format_cpu_to_gpu(void *dst,
                            void *src,
                            int reconstruct,
                            int Vh,
                            int pad,
                            int ghostV,
                            QudaPrecision prec,
                            QudaGaugeFieldOrder cpu_order,
                            cudaStream_t stream)
Definition at line 142 of file misc_helpers.cu.
void link_format_gpu_to_cpu(void *dst,
                            void *src,
                            int Vh,
                            int stride,
                            QudaPrecision prec,
                            cudaStream_t stream)
Definition at line 344 of file misc_helpers.cu.