8 #ifdef USE_TEXTURE_OBJECTS 10 template<
typename OutputType,
typename InputType>
16 #ifndef DIRECT_ACCESS_BLAS 17 cudaTextureObject_t
spinor;
24 #ifndef DIRECT_ACCESS_BLAS 25 Texture(
const cudaColorSpinorField *
x,
bool use_ghost =
false)
26 :
spinor(use_ghost ?
x->GhostTex() :
x->Tex()) { }
28 Texture(
const cudaColorSpinorField *
x,
bool use_ghost =
false)
29 :
spinor(use_ghost ? (const InputType*)(
x->Ghost2()) : (const InputType*)(
x->
V())) { }
39 #ifndef DIRECT_ACCESS_BLAS 40 __device__
inline OutputType
fetch(
unsigned int idx)
47 __device__
inline OutputType
fetch(
unsigned int idx)
54 #ifndef DIRECT_ACCESS_BLAS 56 {
return __hiloint2double(v.y, v.x); }
59 {
return make_double2(__hiloint2double(v.y, v.x), __hiloint2double(v.w, v.z)); }
72 #if (__COMPUTE_CAPABILITY__ >= 130) 74 __inline__ __device__
double fetch_double(texture<int2, 1>
t,
int i)
76 int2 v = tex1Dfetch(
t,
i);
77 return __hiloint2double(v.y, v.x);
82 int4 v = tex1Dfetch(
t,
i);
83 return make_double2(__hiloint2double(v.y, v.x), __hiloint2double(v.w, v.z));
// Fallback double-precision texture fetch. This variant is the stub
// compiled when the architecture-specific implementation above is not
// available (NOTE(review): the guarding #if at original line 72 tests
// __COMPUTE_CAPABILITY__ >= 130, so this presumably covers pre-1.3
// devices — confirm against the full header). It ignores the texture
// and index and trivially yields zero.
__inline__ __device__ double fetch_double(texture<int2, 1> t, int i)
{
  return 0.0;
}
91 return make_double2(0.0, 0.0);
95 #define MAX_TEXELS (1<<27) 102 template<
typename OutputType,
typename InputType,
int tex_
id>
106 #ifdef DIRECT_ACCESS_BLAS 115 #ifdef DIRECT_ACCESS_BLAS 120 Texture(
const cudaColorSpinorField *
x,
bool use_ghost =
false)
121 #ifdef DIRECT_ACCESS_BLAS 122 :
spinor( use_ghost ? (
const InputType*)(
x->Ghost2()) : (
const InputType*)(
x->V())) { }
129 errorQuda(
"Already bound to this texture reference");
134 if (use_ghost)
bind((
const InputType*)(
x->Ghost2()),
x->GhostBytes());
135 else bind((
const InputType*)
x->V(),
x->Bytes());
bound =
true;
141 #ifdef DIRECT_ACCESS_BLAS 153 #ifdef DIRECT_ACCESS_BLAS 164 __device__
inline OutputType
fetch(
unsigned int idx) { OutputType
x;
x.x =0;
return x; };
168 template<
typename OutputType,
typename InputType,
int tex_
id>
171 template<
typename OutputType,
typename InputType,
int tex_
id>
174 #define DECL_TEX(id) \ 175 texture<short2,1,cudaReadModeNormalizedFloat> tex_short2_##id; \ 176 texture<short4,1,cudaReadModeNormalizedFloat> tex_short4_##id; \ 177 texture<float,1> tex_float_##id; \ 178 texture<float2,1> tex_float2_##id; \ 179 texture<float4,1> tex_float4_##id; \ 180 texture<int4,1> tex_double2_##id; 183 #define DEF_BIND_UNBIND(outtype, intype, id) \ 184 template<> inline void Texture<outtype,intype,id>::bind(const intype *ptr, size_t bytes) \ 185 { cudaBindTexture(0,tex_##intype##_##id, ptr, bytes); } \ 186 template<> inline void Texture<outtype,intype,id>::unbind() { cudaUnbindTexture(tex_##intype##_##id); } 189 #define DEF_FETCH_TEX(outtype, intype, id) \ 190 template<> __device__ inline outtype Texture<outtype,intype,id>::fetch(unsigned int idx) \ 191 { return tex1Dfetch(tex_##intype##_##id,idx); } 194 #define DEF_FETCH_DIRECT(outtype, intype, id) \ 195 template<> __device__ inline outtype Texture<outtype,intype,id>::fetch(unsigned int idx) \ 196 { outtype out; copyFloatN(out, spinor[idx]); return out; } 199 #if defined(DIRECT_ACCESS_BLAS) 200 #define DEF_FETCH DEF_FETCH_DIRECT 202 #define DEF_FETCH DEF_FETCH_TEX 206 #if defined(DIRECT_ACCESS_BLAS) || defined(FERMI_NO_DBLE_TEX) 207 #define DEF_FETCH_DBLE DEF_FETCH_DIRECT 209 #define DEF_FETCH_DBLE(outtype, intype, id) \ 210 template<> __device__ inline outtype Texture<outtype,double2,id>::fetch(unsigned int idx) \ 211 { outtype out; copyFloatN(out, fetch_double2(tex_double2_##id,idx)); return out; } 214 #if defined(DIRECT_ACCESS_BLAS) || defined(FERMI_NO_DBLE_TEX) 215 #define DEF_FETCH_DBLE_MIXED DEF_FETCH_DIRECT 217 #define DEF_FETCH_DBLE_MIXED(outtype, intype, id) \ 218 template<> __device__ inline outtype Texture<outtype,intype,id>::fetch(unsigned int idx) \ 219 { outtype out; copyFloatN(out, tex1Dfetch(tex_##intype##_##id,idx)); return out; } 223 #define DEF_BIND_UNBIND_FETCH(outtype, intype, id) \ 224 DEF_BIND_UNBIND(outtype, intype, id) \ 225 DEF_FETCH(outtype, intype, id) 228 
#define DEF_ALL(id) \ 230 DEF_BIND_UNBIND_FETCH(float2, short2, id) \ 231 DEF_BIND_UNBIND_FETCH(float4, short4, id) \ 232 DEF_BIND_UNBIND_FETCH(float, float, id) \ 233 DEF_BIND_UNBIND_FETCH(float2, float2, id) \ 234 DEF_BIND_UNBIND_FETCH(float4, float4, id) \ 235 DEF_BIND_UNBIND(double2, double2, id) \ 236 DEF_BIND_UNBIND(float2, double2, id) \ 237 DEF_FETCH_DBLE(double2, double2, id) \ 238 DEF_FETCH_DBLE(float2, double2, id) \ 239 DEF_BIND_UNBIND(double2, float2, id) \ 240 DEF_BIND_UNBIND(double4, float4, id) \ 241 DEF_BIND_UNBIND(double2, short2, id) \ 242 DEF_BIND_UNBIND(double4, short4, id) \ 243 DEF_FETCH_DBLE_MIXED(double2, float2, id) \ 244 DEF_FETCH_DBLE_MIXED(double4, float4, id) \ 245 DEF_FETCH_DBLE_MIXED(double2, short2, id) \ 246 DEF_FETCH_DBLE_MIXED(double4, short4, id) 256 #undef DEF_BIND_UNBIND 257 #undef DEF_FETCH_DIRECT 260 #undef DEF_FETCH_DBLE 261 #undef DEF_BIND_UNBIND_FETCH 264 #endif // USE_TEXTURE_OBJECTS 278 template <
typename RegType,
typename InterType,
typename StoreType>
281 const size_t reg_size =
sizeof(((RegType*)0)->x);
282 const size_t inter_size =
sizeof(((InterType*)0)->x);
283 const size_t store_size =
sizeof(((StoreType*)0)->x);
285 if (reg_size != inter_size && store_size != 2 && inter_size != 4)
286 errorQuda(
"Precision of register (%lu) and intermediate (%lu) types must match\n",
287 (
unsigned long)reg_size, (
unsigned long)inter_size);
289 if (vecLength<InterType>() != vecLength<StoreType>()) {
290 errorQuda(
"Vector lengths intermediate and register types must match\n");
293 if (vecLength<RegType>() == 0)
errorQuda(
"Vector type not supported\n");
294 if (vecLength<InterType>() == 0)
errorQuda(
"Vector type not supported\n");
295 if (vecLength<StoreType>() == 0)
errorQuda(
"Vector type not supported\n");
299 template <
typename FloatN,
int M>
303 for (
int j=0; j<M; j++)
c[j] =
max_fabs(
x[j]);
305 for (
int j=1; j<M; j++)
c[0] =
fmaxf(
c[j],
c[0]);
318 template <
typename RegType,
typename StoreType,
int N,
int tex_id=-1>
321 typedef typename bridge_mapper<RegType,StoreType>::type
InterType;
324 #ifdef USE_TEXTURE_OBJECTS // texture objects 344 #ifndef USE_TEXTURE_OBJECTS
351 #ifndef USE_TEXTURE_OBJECTS
354 tex(&(static_cast<const cudaColorSpinorField&>(
x))),
355 ghostTex(&(static_cast<const cudaColorSpinorField&>(
x)), true),
360 checkTypes<RegType,InterType,StoreType>();
367 #ifndef USE_TEXTURE_OBJECTS
380 #ifndef USE_TEXTURE_OBJECTS 397 void set(
const cudaColorSpinorField &
x,
int nFace=1){
398 #ifdef USE_TEXTURE_OBJECTS 407 norm = (
float*)
x.Norm();
414 checkTypes<RegType,InterType,StoreType>();
419 __device__
inline void load(RegType
x[],
const int i,
const int parity=0) {
425 #ifndef USE_TEXTURE_OBJECTS 437 #ifndef USE_TEXTURE_OBJECTS 443 for (
int j=0; j<M; j++) {
452 #endif // !USE_TEXTURE_OBJECTS 455 convert<RegType, InterType>(
x,
y, N);
472 #ifndef USE_TEXTURE_OBJECTS 484 #ifndef USE_TEXTURE_OBJECTS 490 for (
int j=0; j<M; j++) {
499 #endif // !USE_TEXTURE_OBJECTS 502 convert<RegType, InterType>(
x,
y, N);
511 else errorQuda(
"Unknown precision type\n");
516 int Bytes()
const {
return N*
sizeof(RegType); }
527 template <
typename RegType,
typename StoreType,
int N,
int write,
int tex_id=-1>
530 typedef typename bridge_mapper<RegType,StoreType>::type
InterType;
534 #ifdef USE_TEXTURE_OBJECTS 537 #define SPINOR spinor 539 #define SPINOR ST::spinor 543 #ifdef USE_TEXTURE_OBJECTS
549 Spinor(
const ColorSpinorField &
x,
int nFace=1) :
ST(
x, nFace)
550 #ifdef USE_TEXTURE_OBJECTS
556 #ifdef USE_TEXTURE_OBJECTS
564 #ifdef USE_TEXTURE_OBJECTS 572 void set(
const cudaColorSpinorField &
x){
574 #ifdef USE_TEXTURE_OBJECTS 583 __device__
inline void save(RegType
x[],
int i,
const int parity = 0) {
587 convert<InterType, RegType>(
y,
x, M);
601 void backup(
char **spinor_h,
char **norm_h,
size_t bytes,
size_t norm_bytes) {
603 *spinor_h =
new char[
bytes];
604 cudaMemcpy(*spinor_h,
SPINOR,
bytes, cudaMemcpyDeviceToHost);
605 if (norm_bytes > 0) {
606 *norm_h =
new char[norm_bytes];
607 cudaMemcpy(*norm_h,
ST::norm, norm_bytes, cudaMemcpyDeviceToHost);
614 void restore(
char **spinor_h,
char **norm_h,
size_t bytes,
size_t norm_bytes) {
616 cudaMemcpy(
SPINOR, *spinor_h,
bytes, cudaMemcpyHostToDevice);
617 if (norm_bytes > 0) {
618 cudaMemcpy(
ST::norm, *norm_h, norm_bytes, cudaMemcpyHostToDevice);
633 #ifndef USE_TEXTURE_OBJECTS
enum QudaPrecision_s QudaPrecision
__host__ __device__ ValueType norm(const complex< ValueType > &z)
Returns the squared magnitude of z (|z|²).
Texture(const cudaColorSpinorField *x, bool use_ghost=false)
SpinorTexture(const SpinorTexture &st)
static __inline__ dim3 dim3 void size_t cudaStream_t int dim
bridge_mapper< RegType, StoreType >::type InterType
Texture< InterType, StoreType, -1 > ghostTex
bridge_mapper< RegType, StoreType >::type InterType
__inline__ __device__ double fetch_double(texture< int2, 1 > t, int i)
__device__ void load(RegType x[], const int i, const int parity=0)
QudaPrecision Precision() const
SpinorTexture< RegType, StoreType, N, tex_id > ST
__device__ void copyFloatN(FloatN &a, const FloatN &b)
Spinor(const ColorSpinorField &x, int nFace=1)
float fmaxf(float, float)
__device__ float store_norm(float *norm, FloatN x[M], int i)
__device__ void loadGhost(RegType x[], const int i, const int dim)
__inline__ __device__ double2 fetch_double2(texture< int4, 1 > t, int i)
Texture(const Texture &tex)
void restore(char **spinor_h, char **norm_h, size_t bytes, size_t norm_bytes)
void backup(char **spinor_h, char **norm_h, size_t bytes, size_t norm_bytes)
Spinor & operator=(const Spinor &src)
cpuColorSpinorField * out
unsigned int cb_norm_offset
SpinorTexture(const ColorSpinorField &x, int nFace=1)
static __inline__ dim3 dim3 void size_t cudaStream_t int enum cudaTextureReadMode readMode static __inline__ const struct texture< T, dim, readMode > & tex
__forceinline__ __host__ __device__ float max_fabs(const float4 &c)
void set(const cudaColorSpinorField &x, int nFace=1)
Texture & operator=(const Texture &tex)
__device__ OutputType operator[](unsigned int idx)
static __inline__ size_t size_t d
Texture< InterType, StoreType, tex_id > tex
__device__ OutputType fetch(unsigned int idx)
cpuColorSpinorField * spinor
bool tex_id_table[MAX_TEX_ID]
void bind(const InputType *, size_t bytes)
SpinorTexture & operator=(const SpinorTexture &src)
__device__ void save(RegType x[], int i, const int parity=0)