3 #define DSLASH_SHARED_FLOATS_PER_THREAD 0 6 #if (CUDA_VERSION >= 4010) 9 #define VOLATILE volatile 13 #define spinorFloat double 15 #if CUDA_VERSION >= 6050 && CUDA_VERSION < 7050 16 #define POW(a, b) pow(a, static_cast<spinorFloat>(b)) 18 #define POW(a, b) pow(a, b) 46 #define mdwf_b5 param.mdwf_b5_d 47 #define mdwf_c5 param.mdwf_c5_d 48 #define mferm param.mferm 52 #define spinorFloat float 53 #define POW(a, b) __fast_pow(a, b) 79 #define mdwf_b5 param.mdwf_b5_f 80 #define mdwf_c5 param.mdwf_c5_f 81 #define mferm param.mferm_f 84 #endif // SPINOR_DOUBLE 113 #if (__COMPUTE_CAPABILITY__ >= 200) 114 #define SHARED_STRIDE 16 // to avoid bank conflicts on Fermi 116 #define SHARED_STRIDE 8 // to avoid bank conflicts on G80 and GT200 119 #if (__COMPUTE_CAPABILITY__ >= 200) 120 #define SHARED_STRIDE 32 // to avoid bank conflicts on Fermi 122 #define SHARED_STRIDE 16 // to avoid bank conflicts on G80 and GT200 155 #ifdef MDWF_mode // Check whether MDWF option is enabled 159 #endif // select MDWF mode 169 int base_idx =
sid%
param.dc.volume_4d_cb;
249 READ_ACCUM(ACCUMTEX,
param.sp_stride)
310 #endif // SPINOR_DOUBLE 311 #endif // DSLASH_XPAY
// Scalar declarations of type `VOLATILE spinorFloat`: one `_re` and one `_im`
// name for every o<r><c> with r in 0..3 and c in 0..2 (24 scalars), plus `kappa`.
//
// Both type tokens are macros #define'd earlier in this file:
//   - VOLATILE    -> `volatile` when CUDA_VERSION >= 4010 (the alternative
//                    branch is not visible in this view).
//   - spinorFloat -> `double` or `float`, chosen by the preprocessor branch
//                    that is closed by `#endif // SPINOR_DOUBLE`.
//
// NOTE(review): presumably `_re`/`_im` are the real and imaginary parts of a
// 4 x 3 complex output accumulator -- confirm against the kernel body.
// NOTE(review): these lines carry no terminators or initializers here and are
// not in index order; verify against the original file before relying on them.
VOLATILE spinorFloat o21_re
VOLATILE spinorFloat o12_im
VOLATILE spinorFloat o20_re
VOLATILE spinorFloat o32_re
VOLATILE spinorFloat o22_im
VOLATILE spinorFloat o11_im
VOLATILE spinorFloat o02_re
VOLATILE spinorFloat o12_re
// NOTE(review): `kappa` is the only name in this run that is not an o<r><c> component.
VOLATILE spinorFloat kappa
VOLATILE spinorFloat o01_re
VOLATILE spinorFloat o31_im
VOLATILE spinorFloat o10_im
VOLATILE spinorFloat o02_im
VOLATILE spinorFloat o30_re
VOLATILE spinorFloat o01_im
VOLATILE spinorFloat o11_re
VOLATILE spinorFloat o00_re
VOLATILE spinorFloat o32_im
VOLATILE spinorFloat o31_re
VOLATILE spinorFloat o30_im
VOLATILE spinorFloat o00_im
VOLATILE spinorFloat o20_im
VOLATILE spinorFloat o21_im
VOLATILE spinorFloat o22_re
VOLATILE spinorFloat o10_re