quda-ref/v1.1.0/convert_8h_source.html

 #pragma once


 #include <cmath>
 #include <type_traits>

 #include <quda_internal.h> // for maximum short, char traits.
 #include <register_traits.h>


 namespace quda

 {


   /**
      @brief Convert a value to single precision.
      @param[in] a Value to convert
      @return a converted with static_cast<float>
   */
   template <typename T> __host__ __device__ inline float i2f(T a)
   {
 #if 0
     // Disabled alternative: assemble the float through integer arithmetic
     // on its bit pattern; will work for up to 23-bit int
     union {
       int32_t i;
       float f;
     };
     i = a + 0x4B400000;
     return f - 12582912.0f;
 #else
     // Active path: ordinary value conversion
     const float converted = static_cast<float>(a);
     return converted;
 #endif
   }


   /**
      @brief Fast float to integer round (to nearest, ties to even under the
      default rounding mode), giving the same result on host and device.

      Device path: adding 12582912.0f (1.5 * 2^23, bit pattern 0x4B400000)
      leaves the rounded integer in the low mantissa bits of the sum. The
      bias is then subtracted so the full int return value is the rounded
      integer, not just its low bits. Only valid for |f| < 2^22.

      Host path: rounds with std::lrint instead of truncating, so that host
      and device produce the same value.

      @param[in] f Value to round
      @return f rounded to the nearest integer
   */
   __device__ __host__ inline int f2i(float f)
   {
 #ifdef __CUDA_ARCH__
     f += 12582912.0f;
     // __float_as_int reinterprets the bits without the strict-aliasing
     // violation of reinterpret_cast<int &>. The low 16 bits of 0x4B400000
     // are zero, so removing the bias does not change the result seen by
     // callers that narrow to short or char.
     return __float_as_int(f) - 0x4B400000;
 #else
     // Round rather than truncate toward zero, matching the device path
     return static_cast<int>(std::lrint(f));
 #endif
   }


   /**
      @brief Fast double to integer round (to nearest, ties to even under the
      default rounding mode), giving the same result on host and device.

      Device path: adding 6755399441055744.0 (1.5 * 2^52) leaves the rounded
      integer in the low 32 bits of the sum's bit pattern, which are then
      extracted. Only valid while the rounded value fits in a 32-bit int.

      Host path: rounds with std::lrint instead of truncating, so that host
      and device produce the same value.

      @param[in] d Value to round
      @return d rounded to the nearest integer
   */
   __device__ __host__ inline int d2i(double d)
   {
 #ifdef __CUDA_ARCH__
     d += 6755399441055744.0;
     // __double2loint reads the low 32 bits directly, avoiding the
     // strict-aliasing violation and byte-order assumption of
     // reinterpret_cast<int &>
     return __double2loint(d);
 #else
     // Round rather than truncate toward zero, matching the device path
     return static_cast<int>(std::lrint(d));
 #endif
   }


   /**
      @brief Copy overload selected when neither T1 nor T2 satisfies isFixed.
      The value is transferred by plain assignment, with whatever implicit
      conversion T1 = T2 performs.
      @param[out] a Destination
      @param[in] b Source
   */
   template <typename T1, typename T2>

   __host__ __device__ inline typename std::enable_if<!isFixed<T1>::value && !isFixed<T2>::value, void>::type

   copy(T1 &a, const T2 &b)

   {

     a = b;

   }


   /**
      @brief Copy overload selected when the source type T2 satisfies isFixed
      and the destination type T1 does not. The source is converted to float
      with i2f and multiplied by fixedInvMaxValue<T2>::value before being
      assigned.
      @param[out] a Destination
      @param[in] b Source
   */
   template <typename T1, typename T2>
   __host__ __device__ inline typename std::enable_if<!isFixed<T1>::value && isFixed<T2>::value, void>::type
   copy(T1 &a, const T2 &b)
   {
     const float as_float = i2f(b);
     a = as_float * fixedInvMaxValue<T2>::value;
   }


   /**
      @brief Copy overload selected when the destination type T1 satisfies
      isFixed and the source type T2 does not. The source is multiplied by
      fixedMaxValue<T1>::value and converted to an integer with f2i before
      being assigned.
      @param[out] a Destination
      @param[in] b Source
   */
   template <typename T1, typename T2>
   __host__ __device__ inline typename std::enable_if<isFixed<T1>::value && !isFixed<T2>::value, void>::type
   copy(T1 &a, const T2 &b)
   {
     const auto scaled = b * fixedMaxValue<T1>::value;
     a = f2i(scaled);
   }


   /**
      @brief copy_scaled overload selected when the destination type T1 does
      not satisfy isFixed: simply forwards to copy(a, b).
      @param[out] a Destination
      @param[in] b Source
   */
   template <typename T1, typename T2>

   __host__ __device__ inline typename std::enable_if<!isFixed<T1>::value, void>::type copy_scaled(T1 &a, const T2 &b)

   {

     copy(a, b);

   }


   /**
      @brief copy_scaled overload selected when the destination type T1
      satisfies isFixed. The source is converted with f2i and assigned
      directly; no multiplication by fixedMaxValue is applied here.
      @param[out] a Destination
      @param[in] b Source
   */
   template <typename T1, typename T2>
   __host__ __device__ inline typename std::enable_if<isFixed<T1>::value, void>::type copy_scaled(T1 &a, const T2 &b)
   {
     const int rounded = f2i(b);
     a = rounded;
   }


   /**
      @brief copy_and_scale overload selected when the source type T2 does
      not satisfy isFixed: forwards to copy(a, b).
      @param[out] a Destination
      @param[in] b Source
      @param[in] c Scale factor; accepted for a uniform signature but not
      used by this overload
   */
   template <typename T1, typename T2, typename T3>

   __host__ __device__ inline typename std::enable_if<!isFixed<T2>::value, void>::type copy_and_scale(T1 &a, const T2 &b,

                                                                                                      const T3 &c)

   {

     copy(a, b);

   }


   /**
      @brief copy_and_scale overload selected when the source type T2
      satisfies isFixed. The source is converted to float with i2f,
      multiplied by fixedInvMaxValue<T2>::value and then by c, and the
      result is assigned to the destination.
      @param[out] a Destination
      @param[in] b Source
      @param[in] c Additional scale factor
   */
   template <typename T1, typename T2, typename T3>
   __host__ __device__ inline typename std::enable_if<isFixed<T2>::value, void>::type
   copy_and_scale(T1 &a, const T2 &b, const T3 &c)
   {
     const auto normalized = i2f(b) * fixedInvMaxValue<T2>::value;
     a = normalized * c;
   }


 } // namespace quda

quda
Definition: blas_lapack.h:24

quda::i2f
__host__ __device__ float i2f(T a)
Definition: convert.h:18

quda::f2i
__device__ __host__ int f2i(float f)
Definition: convert.h:34

quda::d2i
__device__ __host__ int d2i(double d)
Definition: convert.h:45

quda::copy_scaled
__host__ __device__ std::enable_if<!isFixed< T1 >::value, void >::type copy_scaled(T1 &a, const T2 &b)
Specialized variants of the copy function that assume the scaling has already been applied.
Definition: convert.h:88

quda::copy
__host__ __device__ std::enable_if<!isFixed< T1 >::value &&!isFixed< T2 >::value, void >::type copy(T1 &a, const T2 &b)
Copy function which is trivial between floating point types. When converting to an integer type,...
Definition: convert.h:64

quda::copy_and_scale
__host__ __device__ std::enable_if<!isFixed< T2 >::value, void >::type copy_and_scale(T1 &a, const T2 &b, const T3 &c)
Specialized variants of the copy function that include an additional scale factor....
Definition: convert.h:105

quda_internal.h

register_traits.h
Provides precision abstractions and defines the register precision given the storage precision using ...

quda::fixedInvMaxValue
Definition: quda_internal.h:109

quda::fixedMaxValue
Definition: quda_internal.h:93

quda::isFixed::value
static const bool value
Definition: register_traits.h:348