quda-ref/v1.0.0/register__traits_8h_source.html

 #ifndef _REGISTER_TRAITS_H
 #define _REGISTER_TRAITS_H

 #include <quda_internal.h>
 #include <convert.h>
 #include <generics/ldg.h>
 #include <complex_quda.h>
 #include <inline_ptx.h>

 namespace quda {

   /*
     PromoteTypeId<T, U>::Type is the type selected when a computation
     mixes operands of types T and U.  Unless one of the specializations
     below matches, the first type T is used unchanged.
   */
   template <class T, class U> struct PromoteTypeId { typedef T Type; };

   // float paired with double (either order) yields double
   template <> struct PromoteTypeId<float, double> { typedef double Type; };
   template <> struct PromoteTypeId<double, float> { typedef double Type; };

   // a floating-point type paired with int (either order) yields the floating-point type
   template <> struct PromoteTypeId<int, float> { typedef float Type; };
   template <> struct PromoteTypeId<float, int> { typedef float Type; };
   template <> struct PromoteTypeId<int, double> { typedef double Type; };
   template <> struct PromoteTypeId<double, int> { typedef double Type; };

   // a real type paired with the complex type of the same precision yields the complex type
   template <> struct PromoteTypeId<float, complex<float> > { typedef complex<float> Type; };
   template <> struct PromoteTypeId<complex<float>, float> { typedef complex<float> Type; };
   template <> struct PromoteTypeId<double, complex<double> > { typedef complex<double> Type; };
   template <> struct PromoteTypeId<complex<double>, double> { typedef complex<double> Type; };

   /*
     mapper<T>::type gives the register type that corresponds to a
     storage type T:
       double -> double
       float  -> float
       short  -> float
       char   -> float   (listed as "quarter" elsewhere in this file)
     The same mapping is provided for the 2- and 4-component vector
     types.  This allows the register type to be derived from the
     storage type used as a template argument.  The primary template is
     empty, so a type that is not listed has no nested ::type.
    */
   template <typename> struct mapper { };

   // storage types that are already floating point map to themselves
   template <> struct mapper<double> { typedef double type; };
   template <> struct mapper<double2> { typedef double2 type; };
   template <> struct mapper<double4> { typedef double4 type; };
   template <> struct mapper<float> { typedef float type; };
   template <> struct mapper<float2> { typedef float2 type; };
   template <> struct mapper<float4> { typedef float4 type; };

   // short-based storage maps to the float type of the same length
   template <> struct mapper<short> { typedef float type; };
   template <> struct mapper<short2> { typedef float2 type; };
   template <> struct mapper<short4> { typedef float4 type; };

   // char-based storage maps to the float type of the same length
   template <> struct mapper<char> { typedef float type; };
   template <> struct mapper<char2> { typedef float2 type; };
   template <> struct mapper<char4> { typedef float4 type; };

   /*
     bridge_mapper<A, B>::type is a two-argument type map defined only
     for the pairs listed below; the primary template is empty.
     NOTE(review): the roles of A and B are not documented in this
     header - presumably a register type and a storage type; confirm
     against the callers.
   */
   template <typename, typename> struct bridge_mapper { };

   // first argument double2
   template <> struct bridge_mapper<double2, double2> { typedef double2 type; };
   template <> struct bridge_mapper<double2, float2> { typedef double2 type; };
   template <> struct bridge_mapper<double2, float4> { typedef double4 type; };
   template <> struct bridge_mapper<double2, short2> { typedef float2 type; };
   template <> struct bridge_mapper<double2, short4> { typedef float4 type; };
   template <> struct bridge_mapper<double2, char2> { typedef float2 type; };
   template <> struct bridge_mapper<double2, char4> { typedef float4 type; };

   // first argument float2
   template <> struct bridge_mapper<float2, double2> { typedef float2 type; };
   template <> struct bridge_mapper<float2, float2> { typedef float2 type; };
   template <> struct bridge_mapper<float2, short2> { typedef float2 type; };
   template <> struct bridge_mapper<float2, char2> { typedef float2 type; };

   // first argument float4
   template <> struct bridge_mapper<float4, double2> { typedef float2 type; };
   template <> struct bridge_mapper<float4, float4> { typedef float4 type; };
   template <> struct bridge_mapper<float4, short4> { typedef float4 type; };
   template <> struct bridge_mapper<float4, char4> { typedef float4 type; };

   /*
     vec_length<T>::value is the number of components of T: 1 for the
     scalar types, 2 and 4 for the corresponding vector types.  Any type
     that is not listed reports 0.
   */
   template <typename> struct vec_length { static const int value = 0; };

   // scalars
   template <> struct vec_length<double> { static const int value = 1; };
   template <> struct vec_length<float> { static const int value = 1; };
   template <> struct vec_length<short> { static const int value = 1; };
   template <> struct vec_length<char> { static const int value = 1; };

   // two-component vectors
   template <> struct vec_length<double2> { static const int value = 2; };
   template <> struct vec_length<float2> { static const int value = 2; };
   template <> struct vec_length<short2> { static const int value = 2; };
   template <> struct vec_length<char2> { static const int value = 2; };

   // four-component vectors
   template <> struct vec_length<double4> { static const int value = 4; };
   template <> struct vec_length<float4> { static const int value = 4; };
   template <> struct vec_length<short4> { static const int value = 4; };
   template <> struct vec_length<char4> { static const int value = 4; };

   /*
     vector<T, N> is a thin wrapper around a CUDA vector type.  Only the
     two-component double, float and int cases are defined; the primary
     template is empty.  Each wrapper stores its value in the member a
     and converts implicitly back to the wrapped vector type.
   */
   template <typename, int N> struct vector { };

   // wraps a double2, constructed from a double2
   template <> struct vector<double, 2> {
     typedef double2 type;
     type a;

     vector(const type &v)
     {
       a.x = v.x;
       a.y = v.y;
     }

     operator type() const { return a; }
   };

   // wraps a float2, but is constructed from a double2: each component
   // is narrowed to float on assignment
   template <> struct vector<float, 2> {
     typedef float2 type;
     float2 a;

     vector(const double2 &v)
     {
       a.x = v.x;
       a.y = v.y;
     }

     operator type() const { return a; }
   };

   // wraps an int2, constructed from an int2
   template <> struct vector<int, 2> {
     typedef int2 type;
     int2 a;

     vector(const int2 &v)
     {
       a.x = v.x;
       a.y = v.y;
     }

     operator type() const { return a; }
   };

   /*
     scalar<T>::type is the component type of T for the scalar and 2-,
     3- and 4-component vector types listed below.  The primary template
     is empty, so an unlisted type has no nested ::type.
   */
   template <typename> struct scalar { };

   // double family
   template <> struct scalar<double> { typedef double type; };
   template <> struct scalar<double2> { typedef double type; };
   template <> struct scalar<double3> { typedef double type; };
   template <> struct scalar<double4> { typedef double type; };

   // float family
   template <> struct scalar<float> { typedef float type; };
   template <> struct scalar<float2> { typedef float type; };
   template <> struct scalar<float3> { typedef float type; };
   template <> struct scalar<float4> { typedef float type; };

   // short family
   template <> struct scalar<short> { typedef short type; };
   template <> struct scalar<short2> { typedef short type; };
   template <> struct scalar<short3> { typedef short type; };
   template <> struct scalar<short4> { typedef short type; };

   // char family
   template <> struct scalar<char> { typedef char type; };
   template <> struct scalar<char2> { typedef char type; };
   template <> struct scalar<char3> { typedef char type; };
   template <> struct scalar<char4> { typedef char type; };

   /* isHalf<T>::value is true for the half-precision storage types
      (short, short2, short4) and false for every other type. */
   template <typename T> struct isHalf { static const bool value = false; };
   template <> struct isHalf<short4> { static const bool value = true; };
   template <> struct isHalf<short2> { static const bool value = true; };
   template <> struct isHalf<short> { static const bool value = true; };

   /* isQuarter<T>::value is true for the quarter-precision storage types
      (char, char2, char4) and false for every other type. */
   template <typename T> struct isQuarter { static const bool value = false; };
   template <> struct isQuarter<char4> { static const bool value = true; };
   template <> struct isQuarter<char2> { static const bool value = true; };
   template <> struct isQuarter<char> { static const bool value = true; };

   /* isFixed<T>::value is true for the fixed-precision storage types,
      i.e. the short-based and the char-based types, and false for every
      other type. */
   template <typename T> struct isFixed { static const bool value = false; };

   // char-based types
   template <> struct isFixed<char> { static const bool value = true; };
   template <> struct isFixed<char2> { static const bool value = true; };
   template <> struct isFixed<char4> { static const bool value = true; };

   // short-based types
   template <> struct isFixed<short> { static const bool value = true; };
   template <> struct isFixed<short2> { static const bool value = true; };
   template <> struct isFixed<short4> { static const bool value = true; };

   // Generic copy: plain assignment of b to a (with whatever implicit
   // conversion T2 -> T1 provides).  Type pairs that need more than an
   // assignment are handled by the explicit specializations of copy.
   template <typename T1, typename T2>
   __host__ __device__ inline void copy(T1 &a, const T2 &b)
   {
     a = b;
   }

   // copy specialization int2 -> double.  In device code the double is
   // assembled with __hiloint2double, passing b.y as the first (high)
   // argument and b.x as the second (low) argument.  In host code the
   // conversion is not provided: errorQuda("Undefined") is invoked and
   // a is not written.
   template <> __host__ __device__ inline void copy(double &a, const int2 &b)
   {
 #ifndef __CUDA_ARCH__
     errorQuda("Undefined");
 #else
     a = __hiloint2double(b.y, b.x);
 #endif
   }

   // copy specialization int4 -> double2.  In device code each double is
   // assembled with __hiloint2double: a.x from (b.y, b.x) and a.y from
   // (b.w, b.z), the first argument being the high word.  In host code
   // the conversion is not provided: errorQuda("Undefined") is invoked
   // and a is not written.
   template <> __host__ __device__ inline void copy(double2 &a, const int4 &b)
   {
 #ifndef __CUDA_ARCH__
     errorQuda("Undefined");
 #else
     a.x = __hiloint2double(b.y, b.x);
     a.y = __hiloint2double(b.w, b.z);
 #endif
   }

   // copy specialization short -> float: conversion is delegated to s2f
   template <> __host__ __device__ inline void copy(float &a, const short &b)
   {
     a = s2f(b);
   }

   // copy specialization float -> short: the value is multiplied by
   // fixedMaxValue<short>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(short &a, const float &b)
   {
     a = f2i(b * fixedMaxValue<short>::value);
   }

   // copy specialization short2 -> float2: s2f applied to each component
   template <> __host__ __device__ inline void copy(float2 &a, const short2 &b)
   {
     a.x = s2f(b.x);
     a.y = s2f(b.y);
   }

   // copy specialization float2 -> short2: each component is multiplied
   // by fixedMaxValue<short>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(short2 &a, const float2 &b)
   {
     a.x = f2i(b.x * fixedMaxValue<short>::value);
     a.y = f2i(b.y * fixedMaxValue<short>::value);
   }

   // copy specialization short4 -> float4: s2f applied to each component
   template <> __host__ __device__ inline void copy(float4 &a, const short4 &b)
   {
     a.x = s2f(b.x);
     a.y = s2f(b.y);
     a.z = s2f(b.z);
     a.w = s2f(b.w);
   }

   // copy specialization float4 -> short4: each component is multiplied
   // by fixedMaxValue<short>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(short4 &a, const float4 &b)
   {
     a.x = f2i(b.x * fixedMaxValue<short>::value);
     a.y = f2i(b.y * fixedMaxValue<short>::value);
     a.z = f2i(b.z * fixedMaxValue<short>::value);
     a.w = f2i(b.w * fixedMaxValue<short>::value);
   }

   // copy specialization char -> float: conversion is delegated to c2f
   template <> __host__ __device__ inline void copy(float &a, const char &b)
   {
     a = c2f(b);
   }

   // copy specialization float -> char: the value is multiplied by
   // fixedMaxValue<char>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(char &a, const float &b)
   {
     a = f2i(b * fixedMaxValue<char>::value);
   }

   // copy specialization char2 -> float2: c2f applied to each component
   template <> __host__ __device__ inline void copy(float2 &a, const char2 &b)
   {
     a.x = c2f(b.x);
     a.y = c2f(b.y);
   }

   // copy specialization float2 -> char2: each component is multiplied
   // by fixedMaxValue<char>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(char2 &a, const float2 &b)
   {
     a.x = f2i(b.x * fixedMaxValue<char>::value);
     a.y = f2i(b.y * fixedMaxValue<char>::value);
   }

   // copy specialization char4 -> float4: c2f applied to each component
   template <> __host__ __device__ inline void copy(float4 &a, const char4 &b)
   {
     a.x = c2f(b.x);
     a.y = c2f(b.y);
     a.z = c2f(b.z);
     a.w = c2f(b.w);
   }

   // copy specialization float4 -> char4: each component is multiplied
   // by fixedMaxValue<char>::value and then passed through f2i
   template <> __host__ __device__ inline void copy(char4 &a, const float4 &b)
   {
     a.x = f2i(b.x * fixedMaxValue<char>::value);
     a.y = f2i(b.y * fixedMaxValue<char>::value);
     a.z = f2i(b.z * fixedMaxValue<char>::value);
     a.w = f2i(b.w * fixedMaxValue<char>::value);
   }

   // copy_scaled: variants of copy that assume any fixed-point scaling
   // has already been applied to the source value.  The generic version
   // simply forwards to copy; the float -> short/char specializations
   // skip the multiplication by fixedMaxValue that copy performs.
   template <typename T1, typename T2>
   __host__ __device__ inline void copy_scaled(T1 &a, const T2 &b)
   {
     copy(a, b);
   }

   // copy_scaled specialization float4 -> short4: each component goes
   // through f2i only, with no multiplication by fixedMaxValue
   template <> __host__ __device__ inline void copy_scaled(short4 &a, const float4 &b)
   {
     a.x = f2i(b.x); a.y = f2i(b.y);
     a.z = f2i(b.z); a.w = f2i(b.w);
   }

   // copy_scaled specialization float4 -> char4: each component goes
   // through f2i only, with no multiplication by fixedMaxValue
   template <> __host__ __device__ inline void copy_scaled(char4 &a, const float4 &b)
   {
     a.x = f2i(b.x); a.y = f2i(b.y);
     a.z = f2i(b.z); a.w = f2i(b.w);
   }

   // copy_scaled specialization float2 -> short2: each component goes
   // through f2i only, with no multiplication by fixedMaxValue
   template <> __host__ __device__ inline void copy_scaled(short2 &a, const float2 &b)
   {
     a.x = f2i(b.x); a.y = f2i(b.y);
   }

   // copy_scaled specialization float2 -> char2: each component goes
   // through f2i only, with no multiplication by fixedMaxValue
   template <> __host__ __device__ inline void copy_scaled(char2 &a, const float2 &b)
   {
     a.x = f2i(b.x); a.y = f2i(b.y);
   }

   // copy_scaled specialization float -> short: f2i only, no scaling
   template <> __host__ __device__ inline void copy_scaled(short &a, const float &b)
   {
     a = f2i(b);
   }

   // copy_scaled specialization float -> char: f2i only, no scaling
   template <> __host__ __device__ inline void copy_scaled(char &a, const float &b)
   {
     a = f2i(b);
   }

   // copy_and_scale: variants of copy that take an additional scale
   // factor c.  This generic version ignores c and forwards to copy; the
   // scale factor is only used by the specializations whose source b is
   // a short- or char-based type.
   template <typename T1, typename T2, typename T3>
   __host__ __device__ inline void copy_and_scale(T1 &a, const T2 &b, const T3 &c) { copy(a, b); }

   // copy_and_scale specialization short4 -> float4: each component is
   // converted by the two-argument s2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float4 &a, const short4 &b, const float &c)
   {
     a.x = s2f(b.x, c); a.y = s2f(b.y, c);
     a.z = s2f(b.z, c); a.w = s2f(b.w, c);
   }

   // copy_and_scale specialization char4 -> float4: each component is
   // converted by the two-argument c2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float4 &a, const char4 &b, const float &c)
   {
     a.x = c2f(b.x, c); a.y = c2f(b.y, c);
     a.z = c2f(b.z, c); a.w = c2f(b.w, c);
   }

   // copy_and_scale specialization short2 -> float2: each component is
   // converted by the two-argument s2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float2 &a, const short2 &b, const float &c)
   {
     a.x = s2f(b.x, c); a.y = s2f(b.y, c);
   }

   // copy_and_scale specialization char2 -> float2: each component is
   // converted by the two-argument c2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float2 &a, const char2 &b, const float &c)
   {
     a.x = c2f(b.x, c); a.y = c2f(b.y, c);
   }

   // copy_and_scale specialization short -> float: converted by the
   // two-argument s2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float &a, const short &b, const float &c) { a = s2f(b, c); }

   // copy_and_scale specialization char -> float: converted by the
   // two-argument c2f, which receives the scale c
   template <> __host__ __device__ inline void copy_and_scale(float &a, const char &b, const float &c)
   {
     a = c2f(b, c);
   }

   /*
     Trig<isFixed, T>: static wrappers around the trigonometric functions
     for type T.  This primary template forwards directly to atan2, sin,
     cos and sincos and does not look at isFixed; the float cases are
     handled by the explicit specializations Trig<false, float> and
     Trig<true, float>.
   */
   template <bool isFixed, typename T> struct Trig {
     // atan2(a, b)
     __device__ __host__ static T Atan2(const T &a, const T &b)
     {
       return atan2(a, b);
     }

     // sin(a)
     __device__ __host__ static T Sin(const T &a)
     {
       return sin(a);
     }

     // cos(a)
     __device__ __host__ static T Cos(const T &a)
     {
       return cos(a);
     }

     // writes sin(a) to *s and cos(a) to *c through a single sincos call
     __device__ __host__ static void SinCos(const T &a, T *s, T *c)
     {
       sincos(a, s, c);
     }
   };

   /*
     Trig<false, float>: single-precision specialization for the
     isFixed = false case.  Atan2 always uses atan2f.  Sin, Cos and
     SinCos use the fast device intrinsics (__sinf, __cosf, __sincosf)
     when compiled for the device (__CUDA_ARCH__ defined) and the
     sinf / cosf / sincosf library functions on the host.
   */
   template <> struct Trig<false, float> {
     __device__ __host__ static float Atan2(const float &a, const float &b)
     {
       return atan2f(a, b);
     }

     __device__ __host__ static float Sin(const float &a)
     {
 #ifndef __CUDA_ARCH__
       return sinf(a);
 #else
       return __sinf(a);
 #endif
     }

     __device__ __host__ static float Cos(const float &a)
     {
 #ifndef __CUDA_ARCH__
       return cosf(a);
 #else
       return __cosf(a);
 #endif
     }

     // writes the sine of a to *s and the cosine of a to *c
     __device__ __host__ static void SinCos(const float &a, float *s, float *c)
     {
 #ifndef __CUDA_ARCH__
       sincosf(a, s, c);
 #else
       __sincosf(a, s, c);
 #endif
     }
   };

   /*
     Trig<true, float>: single-precision specialization for the
     isFixed = true case.  Angles at this interface are expressed in
     units of pi: Atan2 returns atan2f(a, b) divided by pi, while Sin,
     Cos and SinCos multiply their argument by pi before evaluating the
     function.  As in Trig<false, float>, device code uses the
     __sinf / __cosf / __sincosf intrinsics and host code uses
     sinf / cosf / sincosf.
   */
   template <> struct Trig<true, float> {
     __device__ __host__ static float Atan2(const float &a, const float &b)
     {
       // Divide by pi in single precision.  A bare M_PI is a double, which
       // would promote the division to double precision; the other members
       // of this struct already cast M_PI to float.
       return atan2f(a, b) / static_cast<float>(M_PI);
     }

     __device__ __host__ static float Sin(const float &a)
     {
       const float angle = a * static_cast<float>(M_PI);
 #ifdef __CUDA_ARCH__
       return __sinf(angle);
 #else
       return sinf(angle);
 #endif
     }

     __device__ __host__ static float Cos(const float &a)
     {
       const float angle = a * static_cast<float>(M_PI);
 #ifdef __CUDA_ARCH__
       return __cosf(angle);
 #else
       return cosf(angle);
 #endif
     }

     // writes the sine of (a * pi) to *s and the cosine of (a * pi) to *c
     __device__ __host__ static void SinCos(const float &a, float *s, float *c)
     {
       const float angle = a * static_cast<float>(M_PI);
 #ifdef __CUDA_ARCH__
       __sincosf(angle, s, c);
 #else
       sincosf(angle, s, c);
 #endif
     }
   };


   /*
     VectorType<Float, number>::type is the type made of `number`
     components of type Float, for number = 1, 2 or 4.  The primary
     template is only declared, so any other combination is a compile
     error when ::type is requested.
   */
   template <typename Float, int number> struct VectorType;

   // one component: the scalar type itself
   template <> struct VectorType<double, 1> { typedef double type; };
   template <> struct VectorType<float, 1> { typedef float type; };
   template <> struct VectorType<short, 1> { typedef short type; };   // half precision
   template <> struct VectorType<char, 1> { typedef char type; };     // quarter precision

   // two components
   template <> struct VectorType<double, 2> { typedef double2 type; };
   template <> struct VectorType<float, 2> { typedef float2 type; };
   template <> struct VectorType<short, 2> { typedef short2 type; };  // half precision
   template <> struct VectorType<char, 2> { typedef char2 type; };    // quarter precision

   // four components
   template <> struct VectorType<double, 4> { typedef double4 type; };
   template <> struct VectorType<float, 4> { typedef float4 type; };
   template <> struct VectorType<short, 4> { typedef short4 type; };  // half precision
   template <> struct VectorType<char, 4> { typedef char4 type; };    // quarter precision

   /*
     TexVectorType<Float, number>::type is the matching texture type for
     `number` components of type Float.  It differs from VectorType only
     for double precision, where integer vectors are used instead:
     <double, 1> -> int2 and <double, 2> -> int4.  There is no
     <double, 4> entry, and the primary template is only declared.
   */
   template <typename Float, int number> struct TexVectorType;

   // double precision: integer vectors
   template <> struct TexVectorType<double, 1> { typedef int2 type; };
   template <> struct TexVectorType<double, 2> { typedef int4 type; };

   // one component
   template <> struct TexVectorType<float, 1> { typedef float type; };
   template <> struct TexVectorType<short, 1> { typedef short type; };   // half precision
   template <> struct TexVectorType<char, 1> { typedef char type; };     // quarter precision

   // two components
   template <> struct TexVectorType<float, 2> { typedef float2 type; };
   template <> struct TexVectorType<short, 2> { typedef short2 type; };  // half precision
   template <> struct TexVectorType<char, 2> { typedef char2 type; };    // quarter precision

   // four components
   template <> struct TexVectorType<float, 4> { typedef float4 type; };
   template <> struct TexVectorType<short, 4> { typedef short4 type; };  // half precision
   template <> struct TexVectorType<char, 4> { typedef char4 type; };    // quarter precision

   // Loads element idx from ptr, viewing ptr as an array of Vector.
   // Device code (with USE_LDG defined, which this function does itself)
   // reads through __ldg; host code uses a plain indexed read.
   // Note that the USE_LDG macro stays defined after this function.
   template <typename Vector>
   __device__ __host__ inline Vector vector_load(void *ptr, int idx)
   {
 #define USE_LDG
     Vector *base = reinterpret_cast<Vector *>(ptr);
 #if defined(__CUDA_ARCH__) && defined(USE_LDG)
     return __ldg(base + idx);
 #else
     return base[idx];
 #endif
   }

   // Generic store: writes value to element idx of ptr, viewing ptr as
   // an array of VectorType.  Types with a dedicated device store path
   // are handled by the explicit specializations of vector_store.
   template <typename VectorType>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const VectorType &value)
   {
     VectorType *dst = reinterpret_cast<VectorType *>(ptr) + idx;
     *dst = value;
   }

   // vector_store specialization for double2: device code hands the two
   // components to store_streaming_double2, host code assigns directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const double2 &value)
   {
     double2 *dst = reinterpret_cast<double2 *>(ptr) + idx;
 #if defined(__CUDA_ARCH__)
     store_streaming_double2(dst, value.x, value.y);
 #else
     *dst = value;
 #endif
   }

   // vector_store specialization for float4: device code hands the four
   // components to store_streaming_float4, host code assigns directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const float4 &value)
   {
     float4 *dst = reinterpret_cast<float4 *>(ptr) + idx;
 #if defined(__CUDA_ARCH__)
     store_streaming_float4(dst, value.x, value.y, value.z, value.w);
 #else
     *dst = value;
 #endif
   }

   // vector_store specialization for float2: device code hands the two
   // components to store_streaming_float2, host code assigns directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const float2 &value)
   {
     float2 *dst = reinterpret_cast<float2 *>(ptr) + idx;
 #if defined(__CUDA_ARCH__)
     store_streaming_float2(dst, value.x, value.y);
 #else
     *dst = value;
 #endif
   }

   // vector_store specialization for short4: device code hands the four
   // components to store_streaming_short4, host code assigns directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const short4 &value)
   {
     short4 *dst = reinterpret_cast<short4 *>(ptr) + idx;
 #if defined(__CUDA_ARCH__)
     store_streaming_short4(dst, value.x, value.y, value.z, value.w);
 #else
     *dst = value;
 #endif
   }

   // vector_store specialization for short2: device code hands the two
   // components to store_streaming_short2, host code assigns directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const short2 &value)
   {
     short2 *dst = reinterpret_cast<short2 *>(ptr) + idx;
 #if defined(__CUDA_ARCH__)
     store_streaming_short2(dst, value.x, value.y);
 #else
     *dst = value;
 #endif
   }

   // vector_store specialization for char4.  A char4 is the same size as
   // a short2, so device code reinterprets the value as a short2 and
   // reuses store_streaming_short2; host code assigns the char4 directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const char4 &value)
   {
 #if defined(__CUDA_ARCH__)
     const short2 *packed = reinterpret_cast<const short2 *>(&value);
     store_streaming_short2(reinterpret_cast<short2 *>(ptr) + idx, packed->x, packed->y);
 #else
     reinterpret_cast<char4 *>(ptr)[idx] = value;
 #endif
   }

   // vector_store specialization for char2.  Device code reinterprets
   // the value as a single short and forwards it to vector_store, which
   // then resolves to the generic store for short; host code assigns
   // the char2 directly.
   template <>
   __device__ __host__ inline void vector_store(void *ptr, int idx, const char2 &value)
   {
 #if defined(__CUDA_ARCH__)
     const short &packed = *reinterpret_cast<const short *>(&value);
     vector_store(ptr, idx, packed);
 #else
     reinterpret_cast<char2 *>(ptr)[idx] = value;
 #endif
   }

   // AllocType<large_alloc>::type selects an integer type from the
   // large_alloc flag: size_t when it is true, int when it is false.
   template <bool large_alloc> struct AllocType { };
   template <> struct AllocType<false> { typedef int type; };
   template <> struct AllocType<true> { typedef size_t type; };

 } // namespace quda

 #endif // _REGISTER_TRAITS_H
quda::TexVectorType< float, 2 >::type
float2 type
Definition: register_traits.h:398

quda::TexVectorType< short, 4 >::type
short4 type
Definition: register_traits.h:404

quda::bridge_mapper< double2, double2 >::type
double2 type
Definition: register_traits.h:60

inline_ptx.h

quda::Trig::SinCos
__device__ static __host__ void SinCos(const T &a, T *s, T *c)
Definition: register_traits.h:297

quda::mapper< char >::type
float type
Definition: register_traits.h:47

quda::mapper< short >::type
float type
Definition: register_traits.h:46

quda::mapper< short2 >::type
float2 type
Definition: register_traits.h:51

quda::bridge_mapper< float2, char2 >::type
float2 type
Definition: register_traits.h:74

quda::VectorType< char, 2 >::type
char2 type
Definition: register_traits.h:386

quda::scalar< double >::type
double type
Definition: register_traits.h:117

quda::scalar< char2 >::type
char type
Definition: register_traits.h:128

quda::mapper< float4 >::type
float4 type
Definition: register_traits.h:55

quda::vector< double, 2 >::vector
vector(const type &a)
Definition: register_traits.h:95

quda::Trig::Cos
__device__ static __host__ T Cos(const T &a)
Definition: register_traits.h:296

quda::vector< float, 2 >::type
float2 type
Definition: register_traits.h:100

quda::scalar< char4 >::type
char type
Definition: register_traits.h:126

quda::bridge_mapper< float4, double2 >::type
float2 type
Definition: register_traits.h:67

quda::Trig< false, float >::Cos
__device__ static __host__ float Cos(const float &a)
Definition: register_traits.h:314

quda::TexVectorType< double, 1 >::type
int2 type
Definition: register_traits.h:393

errorQuda
#define errorQuda(...)
Definition: util_quda.h:121

quda::PromoteTypeId< double, int >::Type
double Type
Definition: register_traits.h:27

quda::TexVectorType< float, 1 >::type
float type
Definition: register_traits.h:397

quda::VectorType< double, 2 >::type
double2 type
Definition: register_traits.h:371

quda::vector< double, 2 >::a
type a
Definition: register_traits.h:94

quda::copy_scaled
__host__ __device__ void copy_scaled(T1 &a, const T2 &b)
Definition: register_traits.h:209

quda::Trig< true, float >::SinCos
__device__ static __host__ void SinCos(const float &a, float *s, float *c)
Definition: register_traits.h:356

quda::scalar< short4 >::type
short type
Definition: register_traits.h:122

quda::Trig< false, float >::Sin
__device__ static __host__ float Sin(const float &a)
Definition: register_traits.h:306

quda::Trig< false, float >::SinCos
__device__ static __host__ void SinCos(const float &a, float *s, float *c)
Definition: register_traits.h:323

quda::vector< int, 2 >::a
int2 a
Definition: register_traits.h:108

quda::VectorType< short, 4 >::type
short4 type
Definition: register_traits.h:382

quda::PromoteTypeId< int, float >::Type
float Type
Definition: register_traits.h:30

quda::copy
__host__ __device__ void copy(T1 &a, const T2 &b)
Definition: register_traits.h:152

quda::bridge_mapper< float4, short4 >::type
float4 type
Definition: register_traits.h:69

quda::mapper< char4 >::type
float4 type
Definition: register_traits.h:57

quda::complex< float >
Definition: complex_quda.h:458

quda::mapper< double2 >::type
double2 type
Definition: register_traits.h:49

quda::AllocType< false >::type
int type
Definition: register_traits.h:495

quda::bridge_mapper< double2, char2 >::type
float2 type
Definition: register_traits.h:63

quda::PromoteTypeId< double, complex< double > >::Type
complex< double > Type
Definition: register_traits.h:26

quda::VectorType< short, 2 >::type
short2 type
Definition: register_traits.h:381

quda::PromoteTypeId< complex< double >, double >::Type
complex< double > Type
Definition: register_traits.h:25

quda::mapper< short4 >::type
float4 type
Definition: register_traits.h:56

quda
Definition: blas_cublas.h:5

quda::bridge_mapper< double2, short2 >::type
float2 type
Definition: register_traits.h:62

quda::vector< float, 2 >::vector
vector(const double2 &a)
Definition: register_traits.h:102

quda::scalar< char3 >::type
char type
Definition: register_traits.h:127

quda::scalar
Definition: register_traits.h:113

quda::vector< int, 2 >::type
int2 type
Definition: register_traits.h:107

quda::TexVectorType< short, 2 >::type
short2 type
Definition: register_traits.h:403

quda::bridge_mapper< float2, double2 >::type
float2 type
Definition: register_traits.h:71

quda::TexVectorType
Definition: register_traits.h:390

quda::bridge_mapper< float4, float4 >::type
float4 type
Definition: register_traits.h:68

quda::vector< int, 2 >::vector
vector(const int2 &a)
Definition: register_traits.h:109

quda::scalar< short >::type
short type
Definition: register_traits.h:125

quda::VectorType< char, 1 >::type
char type
Definition: register_traits.h:385

quda::vector< double, 2 >::type
double2 type
Definition: register_traits.h:93

quda::VectorType
Definition: register_traits.h:367

quda::scalar< double4 >::type
double type
Definition: register_traits.h:114

quda::bridge_mapper< float4, char4 >::type
float4 type
Definition: register_traits.h:70

quda::TexVectorType< char, 4 >::type
char4 type
Definition: register_traits.h:409

quda::bridge_mapper< float2, short2 >::type
float2 type
Definition: register_traits.h:73

quda::sin
__host__ __device__ ValueType sin(ValueType x)
Definition: complex_quda.h:51

quda::Trig< true, float >::Sin
__device__ static __host__ float Sin(const float &a)
Definition: register_traits.h:339

quda::PromoteTypeId< double, float >::Type
double Type
Definition: register_traits.h:31

quda::vector_store
__device__ __host__ void vector_store(void *ptr, int idx, const VectorType &value)
Definition: register_traits.h:422

quda::scalar< short2 >::type
short type
Definition: register_traits.h:124

quda::atan2
__host__ __device__ ValueType atan2(ValueType x, ValueType y)
Definition: complex_quda.h:76

quda::PromoteTypeId< float, complex< float > >::Type
complex< float > Type
Definition: register_traits.h:24

quda::bridge_mapper< double2, char4 >::type
float4 type
Definition: register_traits.h:66

quda::PromoteTypeId< float, int >::Type
float Type
Definition: register_traits.h:29

quda::Trig< false, float >::Atan2
__device__ static __host__ float Atan2(const float &a, const float &b)
Definition: register_traits.h:305

quda::VectorType< char, 4 >::type
char4 type
Definition: register_traits.h:387

quda::vec_length
Definition: register_traits.h:76

quda::scalar< double2 >::type
double type
Definition: register_traits.h:116

quda::store_streaming_double2
__device__ void store_streaming_double2(double2 *addr, double x, double y)
Definition: inline_ptx.h:88

quda::bridge_mapper< double2, float4 >::type
double4 type
Definition: register_traits.h:64

quda::bridge_mapper< double2, short4 >::type
float4 type
Definition: register_traits.h:65

quda::scalar< float4 >::type
float type
Definition: register_traits.h:118

quda::scalar< double3 >::type
double type
Definition: register_traits.h:115

quda::PromoteTypeId< complex< float >, float >::Type
complex< float > Type
Definition: register_traits.h:23

quda::TexVectorType< double, 2 >::type
int4 type
Definition: register_traits.h:394

quda::vector< float, 2 >::a
float2 a
Definition: register_traits.h:101

quda::bridge_mapper< double2, float2 >::type
double2 type
Definition: register_traits.h:61

quda::mapper< char2 >::type
float2 type
Definition: register_traits.h:52

quda::store_streaming_float4
__device__ void store_streaming_float4(float4 *addr, float x, float y, float z, float w)
Definition: inline_ptx.h:78

quda::VectorType< double, 4 >::type
double4 type
Definition: register_traits.h:372

quda::isFixed
Definition: register_traits.h:144

quda::TexVectorType< char, 2 >::type
char2 type
Definition: register_traits.h:408

quda::Trig< true, float >::Atan2
__device__ static __host__ float Atan2(const float &a, const float &b)
Definition: register_traits.h:338

quda::mapper
Definition: register_traits.h:43

quda::PromoteTypeId
Definition: register_traits.h:22

quda::s
__shared__ float s[]

quda::PromoteTypeId::Type
T Type
Definition: register_traits.h:22

quda::VectorType< float, 1 >::type
float type
Definition: register_traits.h:375

quda::Trig< true, float >::Cos
__device__ static __host__ float Cos(const float &a)
Definition: register_traits.h:347

quda::mapper< float >::type
float type
Definition: register_traits.h:45

quda::store_streaming_float2
__device__ void store_streaming_float2(float2 *addr, float x, float y)
Definition: inline_ptx.h:93

quda::Trig::Sin
__device__ static __host__ T Sin(const T &a)
Definition: register_traits.h:295

quda::s2f
__host__ __device__ float s2f(short a)
Definition: convert.h:34

complex_quda.h

quda::TexVectorType< char, 1 >::type
char type
Definition: register_traits.h:407

quda::PromoteTypeId< float, double >::Type
double Type
Definition: register_traits.h:32

quda::vector_load
__device__ __host__ VectorType vector_load(void *ptr, int idx)
Definition: register_traits.h:412

quda::bridge_mapper
Definition: register_traits.h:59

quda::cos
__host__ __device__ ValueType cos(ValueType x)
Definition: complex_quda.h:46

quda::mapper< double4 >::type
double4 type
Definition: register_traits.h:54

quda::complex< double >
Definition: complex_quda.h:580

quda::scalar< float3 >::type
float type
Definition: register_traits.h:119

quda::store_streaming_short2
__device__ void store_streaming_short2(short2 *addr, short x, short y)
Definition: inline_ptx.h:98

quda::TexVectorType< float, 4 >::type
float4 type
Definition: register_traits.h:399

quda::isHalf
Definition: register_traits.h:132

quda::VectorType< double, 1 >::type
double type
Definition: register_traits.h:370

quda::AllocType< true >::type
size_t type
Definition: register_traits.h:494

quda::isQuarter
Definition: register_traits.h:138

quda::AllocType
Definition: register_traits.h:493

quda::scalar< float >::type
float type
Definition: register_traits.h:121

quda::TexVectorType< short, 1 >::type
short type
Definition: register_traits.h:402

quda::scalar< char >::type
char type
Definition: register_traits.h:129

quda::store_streaming_short4
__device__ void store_streaming_short4(short4 *addr, short x, short y, short z, short w)
Definition: inline_ptx.h:83

quda::VectorType< short, 1 >::type
short type
Definition: register_traits.h:380

convert.h

quda::mapper< float2 >::type
float2 type
Definition: register_traits.h:50

quda::mapper< double >::type
double type
Definition: register_traits.h:44

quda::f2i
__device__ __host__ int f2i(float f)
Definition: convert.h:93

quda::scalar< short3 >::type
short type
Definition: register_traits.h:123

quda::c2f
__host__ __device__ float c2f(char a)
Definition: convert.h:38

quda::VectorType< float, 4 >::type
float4 type
Definition: register_traits.h:377

quda::PromoteTypeId< int, double >::Type
double Type
Definition: register_traits.h:28

quda::bridge_mapper< float2, float2 >::type
float2 type
Definition: register_traits.h:72

quda::fixedMaxValue
Definition: quda_internal.h:53

quda::VectorType< float, 2 >::type
float2 type
Definition: register_traits.h:376

quda::scalar< float2 >::type
float type
Definition: register_traits.h:120

quda::Trig::Atan2
__device__ static __host__ T Atan2(const T &a, const T &b)
Definition: register_traits.h:294

quda_internal.h

quda::Trig
Definition: register_traits.h:293

quda::copy_and_scale
__host__ __device__ void copy_and_scale(T1 &a, const T2 &b, const T3 &c)
Specialized variants of the copy function that include an additional scale factor. Note the scale factor is ignored unless the input type (b) is either a short or char vector.
Definition: register_traits.h:249