quda-ref/v0.7.0/complex__quda_8h_source.html

 /*

 * Copyright 2008-2009 NVIDIA Corporation

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 * http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


 #pragma once


 #include <math.h>

 #include <cmath>

 #include <complex>

 #include <sstream>

 #include <cuComplex.h>


 // We need this to make sure code inside quda:: that calls sqrt() using real numbers

 // doesn't try to call the complex sqrt, but the standard sqrt

 namespace quda

 {

   template <typename ValueType>

     __host__ __device__

     inline ValueType cos(ValueType x){

     return std::cos(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType sin(ValueType x){

     return std::sin(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType tan(ValueType x){

     return std::tan(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType acos(ValueType x){

     return std::acos(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType asin(ValueType x){

     return std::asin(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType atan(ValueType x){

     return std::atan(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType atan2(ValueType x,ValueType y){

     return std::atan2(x,y);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType cosh(ValueType x){

     return std::cosh(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType sinh(ValueType x){

     return std::sinh(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType tanh(ValueType x){

     return std::tanh(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType exp(ValueType x){

     return std::exp(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType log(ValueType x){

     return std::log(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType log10(ValueType x){

     return std::log10(x);

   }

   template <typename ValueType, typename ExponentType>

     __host__ __device__

     inline ValueType pow(ValueType x, ExponentType e){

     return std::pow(x,e);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType sqrt(ValueType x){

     return std::sqrt(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType abs(ValueType x){

     return std::abs(x);

   }

   template <typename ValueType>

     __host__ __device__

     inline ValueType conj(ValueType x){

     return x;

   }


   template <typename ValueType> struct complex;

   template <> struct complex<float>;

   template <> struct complex<double>;


   template<typename ValueType>

   __host__ __device__

   ValueType abs(const complex<ValueType>& z);

   template<typename ValueType>

   __host__ __device__

   ValueType arg(const complex<ValueType>& z);

   template<typename ValueType>

   __host__ __device__

   ValueType norm(const complex<ValueType>& z);


   template<typename ValueType>

   __host__ __device__

   complex<ValueType> conj(const complex<ValueType>& z);

   template<typename ValueType>

   __host__ __device__

   complex<ValueType> polar(const ValueType& m, const ValueType& theta = 0);


   // Arithmetic operators:

   // Multiplication

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const complex<ValueType>& rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const ValueType & rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const ValueType& lhs, const complex<ValueType>& rhs);

   // Division

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const complex<ValueType>& rhs);

   template <>

     __host__ __device__

     inline complex<float> operator/(const complex<float>& lhs, const complex<float>& rhs);

   template <>

     __host__ __device__

     inline complex<double> operator/(const complex<double>& lhs, const complex<double>& rhs);


   // Addition

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const complex<ValueType>& rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const ValueType & rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const ValueType& lhs, const complex<ValueType>& rhs);

   // Subtraction

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const complex<ValueType>& rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const ValueType & rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const ValueType& lhs, const complex<ValueType>& rhs);


   // Unary plus and minus

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& rhs);

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& rhs);


   // Transcendentals:

   // Returns the complex cosine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> cos(const complex<ValueType>& z);

   // Returns the complex hyperbolic cosine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> cosh(const complex<ValueType>& z);

   // Returns the complex base e exponential of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> exp(const complex<ValueType>& z);

   // Returns the complex natural logarithm of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> log(const complex<ValueType>& z);

   // Returns the complex base 10 logarithm of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> log10(const complex<ValueType>& z);

   // Returns z to the n'th power.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> pow(const complex<ValueType>& z, const int& n);

   // Returns z to the x'th power.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> pow(const complex<ValueType>&z, const ValueType&x);

   // Returns z to the z2'th power.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> pow(const complex<ValueType>&z,

 const complex<ValueType>&z2);

   // Returns x to the z'th power.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> pow(const ValueType& x, const complex<ValueType>& z);

   // Returns the complex sine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> sin(const complex<ValueType>&z);

   // Returns the complex hyperbolic sine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> sinh(const complex<ValueType>&z);

   // Returns the complex square root of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> sqrt(const complex<ValueType>&z);

   // Returns the complex tangent of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> tan(const complex<ValueType>&z);

   // Returns the complex hyperbolic tangent of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> tanh(const complex<ValueType>&z);


   // Inverse Trigonometric:

   // Returns the complex arc cosine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> acos(const complex<ValueType>& z);

   // Returns the complex arc sine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> asin(const complex<ValueType>& z);

   // Returns the complex arc tangent of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> atan(const complex<ValueType>& z);

   // Returns the complex hyperbolic arc cosine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> acosh(const complex<ValueType>& z);

   // Returns the complex hyperbolic arc sine of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> asinh(const complex<ValueType>& z);

   // Returns the complex hyperbolic arc tangent of z.

   template <typename ValueType>

     __host__ __device__

   complex<ValueType> atanh(const complex<ValueType>& z);


   // Stream operators:

   template<typename ValueType,class charT, class traits>

     std::basic_ostream<charT, traits>& operator<<(std::basic_ostream<charT, traits>& os, const complex<ValueType>& z);

   template<typename ValueType, typename charT, class traits>

     std::basic_istream<charT, traits>&

     operator>>(std::basic_istream<charT, traits>& is, complex<ValueType>& z);


   // Stream operators

   template<typename ValueType,class charT, class traits>

     std::basic_ostream<charT, traits>& operator<<(std::basic_ostream<charT, traits>& os, const complex<ValueType>& z)

     {

       os << '(' << z.real() << ',' << z.imag() << ')';

       return os;

     };


   template<typename ValueType, typename charT, class traits>

     std::basic_istream<charT, traits>&

     operator>>(std::basic_istream<charT, traits>& is, complex<ValueType>& z)

     {

       ValueType re, im;


       charT ch;

       is >> ch;


       if(ch == '(')

       {

         is >> re >> ch;

         if (ch == ',')

         {

           is >> im >> ch;

           if (ch == ')')

           {

             z = complex<ValueType>(re, im);

           }

           else

           {

             is.setstate(std::ios_base::failbit);

           }

         }

         else if (ch == ')')

         {

           z = re;

         }

         else

         {

           is.setstate(std::ios_base::failbit);

         }

       }

       else

       {

         is.putback(ch);

         is >> re;

         z = re;

       }

       return is;

     }


 template <typename T>

   struct norm_type {

     typedef T type;

   };

  template <typename T>

    struct norm_type< complex<T> > {

    typedef T type;

  };


 template <typename ValueType>

 struct complex

 {

 public:

   typedef ValueType value_type;


   // Constructors

   __host__ __device__

     inline complex<ValueType>(const ValueType & re = ValueType(), const ValueType& im = ValueType())

     {

       real(re);

       imag(im);

     }


   template <class X>

     __host__ __device__

     inline complex<ValueType>(const complex<X> & z)

     {

       real(z.real());

       imag(z.imag());

     }


   template <class X>

     __host__ __device__

     inline complex<ValueType>(const std::complex<X> & z)

     {

       real(z.real());

       imag(z.imag());

     }


   template <typename T>

     __host__ __device__

     inline complex<ValueType>& operator=(const complex<T> z)

     {

       real(z.real());

       imag(z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<ValueType>& operator+=(const complex<ValueType> z)

     {

       real(real()+z.real());

       imag(imag()+z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<ValueType>& operator-=(const complex<ValueType> z)

     {

       real(real()-z.real());

       imag(imag()-z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<ValueType>& operator*=(const complex<ValueType> z)

     {

       *this = *this * z;

       return *this;

     }


   __host__ __device__

     inline complex<ValueType>& operator/=(const complex<ValueType> z)

     {

       *this = *this / z;

       return *this;

     }


   __host__ __device__ inline ValueType real() const volatile;

   __host__ __device__ inline ValueType imag() const volatile;

   __host__ __device__ inline ValueType real() const;

   __host__ __device__ inline ValueType imag() const;

   __host__ __device__ inline void real(ValueType) volatile;

   __host__ __device__ inline void imag(ValueType) volatile;

   __host__ __device__ inline void real(ValueType);

   __host__ __device__ inline void imag(ValueType);

 };


 // TODO make cuFloatComplex and cuDoubleComplex protected

 // TODO see if returning references is a perf hazard


 template<>

 struct complex <float> : public cuFloatComplex

 {

 public:

   typedef float value_type;

   __host__ __device__

     inline complex<float>(){};

   __host__ __device__

     inline complex<float>(const float & re, const float& im = float())

     {

       real(re);

       imag(im);

     }


   // For some reason having the following constructor

   // explicitly makes things faster with at least g++

   __host__ __device__

     complex<float>(const complex<float> & z)

     : cuFloatComplex(z){}


   __host__ __device__

     complex<float>(cuFloatComplex z)

     : cuFloatComplex(z){}


   template <class X>

     inline complex<float>(const std::complex<X> & z)

     {

       real(z.real());

       imag(z.imag());

     }


   // Member operators

   template <typename T>

     __host__ __device__

     inline volatile complex<float>& operator=(const complex<T> z) volatile

     {

       real(z.real());

       imag(z.imag());

       return *this;

     }


   template <typename T>

     __host__ __device__

     inline complex<float>& operator=(const complex<T> z)

     {

       real(z.real());

       imag(z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<float>& operator+=(const complex<float> z)

     {

       real(real()+z.real());

       imag(imag()+z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<float>& operator-=(const complex<float> z)

     {

       real(real()-z.real());

       imag(imag()-z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<float>& operator*=(const complex<float> z)

     {

       *this = *this * z;

       return *this;

     }


   __host__ __device__

     inline complex<float>& operator/=(const complex<float> z)

     {

       *this = *this / z;

       return *this;

     }


   // Let the compiler synthesize the copy and assignment operators.

   __host__ __device__ inline complex<float>(const volatile complex<float> & z)

   {

     real(z.real());

     imag(z.imag());

   }


   __host__ __device__ inline float real() const volatile{ return x; }

   __host__ __device__ inline float imag() const volatile{ return y; }

   __host__ __device__ inline float real() const{ return x; }

   __host__ __device__ inline float imag() const{ return y; }

   __host__ __device__ inline void real(float re)volatile{ x = re; }

   __host__ __device__ inline void imag(float im)volatile{ y = im; }

   __host__ __device__ inline void real(float re){ x = re; }

   __host__ __device__ inline void imag(float im){ y = im; }


   // cast operators

   inline operator std::complex<float>() const { return std::complex<float>(real(),imag()); }

   // inline operator float() const { return real(); }

 };


 template<>

 struct complex <double> : public cuDoubleComplex

 {

 public:

   typedef double value_type;

   __host__ __device__

     inline complex<double>(){};

   __host__ __device__

     inline complex<double>(const double & re, const double& im = double())

     {

       real(re);

       imag(im);

     }


   // For some reason having the following constructor

   // explicitly makes things faster with at least g++

   __host__ __device__

     inline complex<double>(const complex<double> & z)

     : cuDoubleComplex(z) {}


   __host__ __device__

     inline complex<double>(cuDoubleComplex z)

     : cuDoubleComplex(z) {}


   template <class X>

     inline complex<double>(const std::complex<X> & z)

     {

       real(z.real());

       imag(z.imag());

     }


   // Member operators

   template <typename T>

     __host__ __device__

     inline volatile complex<double>& operator=(const complex<T> z) volatile

     {

       real(z.real());

       imag(z.imag());

       return *this;

     }


   template <typename T>

     __host__ __device__

     inline complex<double>& operator=(const complex<T> z)

     {

       real(z.real());

       imag(z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<double>& operator+=(const complex<double> z)

     {

       real(real()+z.real());

       imag(imag()+z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<double>& operator-=(const complex<double> z)

     {

       real(real()-z.real());

       imag(imag()-z.imag());

       return *this;

     }


   __host__ __device__

     inline complex<double>& operator*=(const complex<double> z)

     {

       *this = *this * z;

       return *this;

     }


   __host__ __device__

     inline complex<double>& operator/=(const complex<double> z)

     {

       *this = *this / z;

       return *this;

     }


   __host__ __device__ inline complex<double>(const volatile complex<double> & z)

   {

     real(z.real());

     imag(z.imag());

   }


   // Let the compiler synthesize the copy and assignment operators.

   __host__ __device__ inline double real() const volatile { return x; }

   __host__ __device__ inline double imag() const volatile { return y; }

   __host__ __device__ inline double real() const { return x; }

   __host__ __device__ inline double imag() const { return y; }

   __host__ __device__ inline void real(double re)volatile{ x = re; }

   __host__ __device__ inline void imag(double im)volatile{ y = im; }

   __host__ __device__ inline void real(double re){ x = re; }

   __host__ __device__ inline void imag(double im){ y = im; }


   // cast operators

   inline operator std::complex<double>() const { return std::complex<double>(real(),imag()); }

   // inline operator double() { return real(); }

 };


   // Binary arithmetic operations

   // At the moment I'm implementing the basic functions, and the

   // corresponding cuComplex calls are commented.


   template<typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& lhs,

 const complex<ValueType>& rhs){

     return complex<ValueType>(lhs.real()+rhs.real(),lhs.imag()+rhs.imag());

     // return cuCaddf(lhs,rhs);

   }


   template<typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const volatile complex<ValueType>& lhs,

 const volatile complex<ValueType>& rhs){

     return complex<ValueType>(lhs.real()+rhs.real(),lhs.imag()+rhs.imag());

     // return cuCaddf(lhs,rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const ValueType & rhs){

     return complex<ValueType>(lhs.real()+rhs,lhs.imag());

     // return cuCaddf(lhs,complex<ValueType>(rhs));

   }

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const ValueType& lhs, const complex<ValueType>& rhs){

     return complex<ValueType>(rhs.real()+lhs,rhs.imag());

     // return cuCaddf(complex<float>(lhs),rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const complex<ValueType>& rhs){

     return complex<ValueType>(lhs.real()-rhs.real(),lhs.imag()-rhs.imag());

     // return cuCsubf(lhs,rhs);

   }

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const ValueType & rhs){

     return complex<ValueType>(lhs.real()-rhs,lhs.imag());

     // return cuCsubf(lhs,complex<float>(rhs));

   }

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const ValueType& lhs, const complex<ValueType>& rhs){

     return complex<ValueType>(lhs-rhs.real(),-rhs.imag());

     // return cuCsubf(complex<float>(lhs),rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const complex<ValueType>& lhs,

 const complex<ValueType>& rhs){

     return complex<ValueType>(lhs.real()*rhs.real()-lhs.imag()*rhs.imag(),

 lhs.real()*rhs.imag()+lhs.imag()*rhs.real());

     // return cuCmulf(lhs,rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const ValueType & rhs){

     return complex<ValueType>(lhs.real()*rhs,lhs.imag()*rhs);

     // return cuCmulf(lhs,complex<float>(rhs));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator*(const ValueType& lhs, const complex<ValueType>& rhs){

     return complex<ValueType>(rhs.real()*lhs,rhs.imag()*lhs);

     // return cuCmulf(complex<float>(lhs),rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const complex<ValueType>& rhs){

     const ValueType cross_norm = lhs.real() * rhs.real() + lhs.imag() * rhs.imag();

     const ValueType rhs_norm = norm(rhs);

     return complex<ValueType>(cross_norm/rhs_norm,

 (lhs.imag() * rhs.real() - lhs.real() * rhs.imag()) / rhs_norm);

   }


   template <>

     __host__ __device__

     inline complex<float> operator/(const complex<float>& lhs, const complex<float>& rhs){

     return cuCdivf(lhs,rhs);

   }


   template <>

     __host__ __device__

     inline complex<double> operator/(const complex<double>& lhs, const complex<double>& rhs){

     return cuCdiv(lhs,rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const ValueType & rhs){

     return complex<ValueType>(lhs.real()/rhs,lhs.imag()/rhs);

     // return cuCdivf(lhs,complex<float>(rhs));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator/(const ValueType& lhs, const complex<ValueType>& rhs){

     const ValueType cross_norm = lhs * rhs.real();

     const ValueType rhs_norm = norm(rhs);

     return complex<ValueType>(cross_norm/rhs_norm,(-lhs.real() * rhs.imag()) / rhs_norm);

   }


   template <>

     __host__ __device__

     inline complex<float> operator/(const float& lhs, const complex<float>& rhs){

     return cuCdivf(complex<float>(lhs),rhs);

   }

   template <>

     __host__ __device__

     inline complex<double> operator/(const double& lhs, const complex<double>& rhs){

     return cuCdiv(complex<double>(lhs),rhs);

   }


   // Unary arithmetic operations

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator+(const complex<ValueType>& rhs){

     return rhs;

   }

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> operator-(const complex<ValueType>& rhs){

     return rhs*-ValueType(1);

   }


   // Equality operators

   template <typename ValueType>

     __host__ __device__

     inline bool operator==(const complex<ValueType>& lhs, const complex<ValueType>& rhs){

     if(lhs.real() == rhs.real() && lhs.imag() == rhs.imag()){

       return true;

     }

     return false;

   }

   template <typename ValueType>

     __host__ __device__

     inline bool operator==(const ValueType & lhs, const complex<ValueType>& rhs){

     if(lhs == rhs.real() && rhs.imag() == 0){

       return true;

     }

     return false;

   }

   template <typename ValueType>

     __host__ __device__

     inline bool operator==(const complex<ValueType> & lhs, const ValueType& rhs){

     if(lhs.real() == rhs && lhs.imag() == 0){

       return true;

     }

     return false;

   }


   template <typename ValueType>

     __host__ __device__

     inline bool operator!=(const complex<ValueType>& lhs, const complex<ValueType>& rhs){

     return !(lhs == rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline bool operator!=(const ValueType & lhs, const complex<ValueType>& rhs){

     return !(lhs == rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline bool operator!=(const complex<ValueType> & lhs, const ValueType& rhs){

     return !(lhs == rhs);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> conj(const complex<ValueType>& z){

     return complex<ValueType>(z.real(),-z.imag());

   }


   template <typename ValueType>

     __host__ __device__

     inline ValueType abs(const complex<ValueType>& z){

     return ::hypot(z.real(),z.imag());

   }

   template <>

     __host__ __device__

     inline float abs(const complex<float>& z){

     return ::hypotf(z.real(),z.imag());

   }

   template<>

     __host__ __device__

     inline double abs(const complex<double>& z){

     return ::hypot(z.real(),z.imag());

   }


   template <typename ValueType>

     __host__ __device__

     inline ValueType arg(const complex<ValueType>& z){

     return atan2(z.imag(),z.real());

   }

   template<>

     __host__ __device__

     inline float arg(const complex<float>& z){

     return atan2f(z.imag(),z.real());

   }

   template<>

     __host__ __device__

     inline double arg(const complex<double>& z){

     return atan2(z.imag(),z.real());

   }


   template <typename ValueType>

     __host__ __device__

     inline ValueType norm(const complex<ValueType>& z){

     return z.real()*z.real() + z.imag()*z.imag();

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> polar(const ValueType & m, const ValueType & theta){

     return complex<ValueType>(m * ::cos(theta),m * ::sin(theta));

   }


   template <>

     __host__ __device__

     inline complex<float> polar(const float & magnitude, const float & angle){

     return complex<float>(magnitude * ::cosf(angle),magnitude * ::sinf(angle));

   }


   template <>

     __host__ __device__

     inline complex<double> polar(const double & magnitude, const double & angle){

     return complex<double>(magnitude * ::cos(angle),magnitude * ::sin(angle));

   }


   // Transcendental functions implementation

   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> cos(const complex<ValueType>& z){

     const ValueType re = z.real();

     const ValueType im = z.imag();

     return complex<ValueType>(::cos(re) * ::cosh(im), -::sin(re) * ::sinh(im));

   }


   template <>

     __host__ __device__

     inline complex<float> cos(const complex<float>& z){

     const float re = z.real();

     const float im = z.imag();

     return complex<float>(cosf(re) * coshf(im), -sinf(re) * sinhf(im));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> cosh(const complex<ValueType>& z){

     const ValueType re = z.real();

     const ValueType im = z.imag();

     return complex<ValueType>(::cosh(re) * ::cos(im), ::sinh(re) * ::sin(im));

   }


   template <>

     __host__ __device__

     inline complex<float> cosh(const complex<float>& z){

     const float re = z.real();

     const float im = z.imag();

     return complex<float>(::coshf(re) * ::cosf(im), ::sinhf(re) * ::sinf(im));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> exp(const complex<ValueType>& z){

     return polar(::exp(z.real()),z.imag());

   }


   template <>

     __host__ __device__

     inline complex<float> exp(const complex<float>& z){

     return polar(::expf(z.real()),z.imag());

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> log(const complex<ValueType>& z){

     return complex<ValueType>(::log(abs(z)),arg(z));

   }


   template <>

     __host__ __device__

     inline complex<float> log(const complex<float>& z){

     return complex<float>(::logf(abs(z)),arg(z));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> log10(const complex<ValueType>& z){

     // Using the explicit literal prevents compile time warnings in

     // devices that don't support doubles

     return log(z)/ValueType(2.30258509299404568402);

     // return log(z)/ValueType(::log(10.0));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> pow(const complex<ValueType>& z, const ValueType & exponent){

     return exp(log(z)*exponent);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> pow(const complex<ValueType>& z, const complex<ValueType> & exponent){

     return exp(log(z)*exponent);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> pow(const ValueType & x, const complex<ValueType> & exponent){

     return exp(::log(x)*exponent);

   }


   template <>

     __host__ __device__

     inline complex<float> pow(const float & x, const complex<float> & exponent){

     return exp(::logf(x)*exponent);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> pow(const complex<ValueType>& z,const int & exponent){

     return exp(log(z)*ValueType(exponent));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> sin(const complex<ValueType>& z){

     const ValueType re = z.real();

     const ValueType im = z.imag();

     return complex<ValueType>(::sin(re) * ::cosh(im), ::cos(re) * ::sinh(im));

   }


   template <>

     __host__ __device__

     inline complex<float> sin(const complex<float>& z){

     const float re = z.real();

     const float im = z.imag();

     return complex<float>(::sinf(re) * ::coshf(im), ::cosf(re) * ::sinhf(im));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> sinh(const complex<ValueType>& z){

     const ValueType re = z.real();

     const ValueType im = z.imag();

     return complex<ValueType>(::sinh(re) * ::cos(im), ::cosh(re) * ::sin(im));

   }


   template <>

     __host__ __device__

     inline complex<float> sinh(const complex<float>& z){

     const float re = z.real();

     const float im = z.imag();

     return complex<float>(::sinhf(re) * ::cosf(im), ::coshf(re) * ::sinf(im));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> sqrt(const complex<ValueType>& z){

     return polar(::sqrt(abs(z)),arg(z)/ValueType(2));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<float> sqrt(const complex<float>& z){

     return polar(::sqrtf(abs(z)),arg(z)/float(2));

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> tan(const complex<ValueType>& z){

     return sin(z)/cos(z);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> tanh(const complex<ValueType>& z){

     // This implementation seems better than the simple sin/cos

     return (exp(ValueType(2)*z)-ValueType(1))/(exp(ValueType(2)*z)+ValueType(1));

     // return sinh(z)/cosh(z);

   }


   // Inverse trigonometric functions implementation


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> acos(const complex<ValueType>& z){

     const complex<ValueType> ret = asin(z);

     return complex<ValueType>(ValueType(M_PI/2.0) - ret.real(),-ret.imag());

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> asin(const complex<ValueType>& z){

     const complex<ValueType> i(0,1);

     return -i*asinh(i*z);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> atan(const complex<ValueType>& z){

     const complex<ValueType> i(0,1);

     return -i*atanh(i*z);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> acosh(const complex<ValueType>& z){

     quda::complex<ValueType> ret((z.real() - z.imag()) * (z.real() + z.imag()) - ValueType(1.0),

 ValueType(2.0) * z.real() * z.imag());

     ret = sqrt(ret);

     if (z.real() < ValueType(0.0)){

       ret = -ret;

     }

     ret += z;

     ret = log(ret);

     if (ret.real() < ValueType(0.0)){

       ret = -ret;

     }

     return ret;


     /*

 quda::complex<ValueType> ret = log(sqrt(z*z-ValueType(1))+z);

 if(ret.real() < 0){

 ret.real(-ret.real());

 }

 return ret;

 */

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> asinh(const complex<ValueType>& z){

     return log(sqrt(z*z+ValueType(1))+z);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<ValueType> atanh(const complex<ValueType>& z){

     ValueType imag2 = z.imag() * z.imag();

     ValueType n = ValueType(1.0) + z.real();

     n = imag2 + n * n;


     ValueType d = ValueType(1.0) - z.real();

     d = imag2 + d * d;

     complex<ValueType> ret(ValueType(0.25) * (::log(n) - ::log(d)),0);


     d = ValueType(1.0) - z.real() * z.real() - imag2;


     ret.imag(ValueType(0.5) * ::atan2(ValueType(2.0) * z.imag(), d));

     return ret;

     //return (log(ValueType(1)+z)-log(ValueType(1)-z))/ValueType(2);

   }


   template <typename ValueType>

     __host__ __device__

     inline complex<float> atanh(const complex<float>& z){

         float imag2 = z.imag() * z.imag();

     float n = float(1.0) + z.real();

     n = imag2 + n * n;


     float d = float(1.0) - z.real();

     d = imag2 + d * d;

     complex<float> ret(float(0.25) * (::logf(n) - ::logf(d)),0);


     d = float(1.0) - z.real() * z.real() - imag2;


     ret.imag(float(0.5) * ::atan2f(float(2.0) * z.imag(), d));

     return ret;

     //return (log(ValueType(1)+z)-log(ValueType(1)-z))/ValueType(2);


   }


 } // end namespace quda

quda::sinh
__host__ __device__ complex< float > sinh(const complex< float > &z)
Definition: complex_quda.h:1005

quda::tanh
__host__ __device__ ValueType tanh(ValueType x)
Definition: complex_quda.h:80

quda::sinh
__host__ __device__ ValueType sinh(ValueType x)
Definition: complex_quda.h:75

quda::complex< float >::operator-=
__host__ __device__ complex< float > & operator-=(const complex< float > z)
Definition: complex_quda.h:493

quda::complex< double >::operator=
__host__ __device__ complex< double > & operator=(const complex< T > z)
Definition: complex_quda.h:578

y
int y[4]
Definition: staggered_dslash_core.h:356

quda::complex::value_type
ValueType value_type
Definition: complex_quda.h:356

quda::norm
__host__ __device__ ValueType norm(const complex< ValueType > &z)
Returns the magnitude of z squared.
Definition: complex_quda.h:859

quda::atan
__host__ __device__ ValueType atan(ValueType x)
Definition: complex_quda.h:60

quda::complex< double >::operator-=
__host__ __device__ complex< double > & operator-=(const complex< double > z)
Definition: complex_quda.h:594

quda::exp
__host__ __device__ ValueType exp(ValueType x)
Definition: complex_quda.h:85

quda::complex< float >::operator*=
__host__ __device__ complex< float > & operator*=(const complex< float > z)
Definition: complex_quda.h:501

quda::cosh
__host__ __device__ ValueType cosh(ValueType x)
Definition: complex_quda.h:70

quda::complex< double >::real
__host__ __device__ void real(double re) volatile
Definition: complex_quda.h:626

quda::sqrt
__host__ __device__ ValueType sqrt(ValueType x)
Definition: complex_quda.h:105

quda::cosh
__host__ __device__ complex< float > cosh(const complex< float > &z)
Definition: complex_quda.h:908

quda::complex< float >::real
__host__ __device__ void real(float re)
Definition: complex_quda.h:527

quda::complex::imag
__host__ __device__ ValueType imag() const volatile

quda::tanh
__host__ __device__ complex< ValueType > tanh(const complex< ValueType > &z)
Definition: complex_quda.h:1031

quda::complex< float >::imag
__host__ __device__ void imag(float im)
Definition: complex_quda.h:528

quda::complex< float >::real
__host__ __device__ float real() const
Definition: complex_quda.h:523

quda::complex< float >
Definition: complex_quda.h:435

quda::operator>>
std::basic_istream< charT, traits > & operator>>(std::basic_istream< charT, traits > &is, complex< ValueType > &z)
Definition: complex_quda.h:303

quda::tan
__host__ __device__ ValueType tan(ValueType x)
Definition: complex_quda.h:45

quda::complex< double >::imag
__host__ __device__ double imag() const
Definition: complex_quda.h:625

quda::complex< double >::imag
__host__ __device__ void imag(double im) volatile
Definition: complex_quda.h:627

quda::complex::operator+=
__host__ __device__ complex< ValueType > & operator+=(const complex< ValueType > z)
Definition: complex_quda.h:392

quda::complex< float >::real
__host__ __device__ void real(float re) volatile
Definition: complex_quda.h:525

quda::complex< float >::operator=
__host__ __device__ complex< float > & operator=(const complex< T > z)
Definition: complex_quda.h:477

quda::complex< float >::value_type
float value_type
Definition: complex_quda.h:438

quda::tan
__host__ __device__ complex< ValueType > tan(const complex< ValueType > &z)
Definition: complex_quda.h:1025

quda::complex< float >::imag
__host__ __device__ float imag() const
Definition: complex_quda.h:524

quda::norm_type::type
T type
Definition: complex_quda.h:345

quda::complex::operator-=
__host__ __device__ complex< ValueType > & operator-=(const complex< ValueType > z)
Definition: complex_quda.h:400

quda::complex::operator*=
__host__ __device__ complex< ValueType > & operator*=(const complex< ValueType > z)
Definition: complex_quda.h:408

quda::asin
__host__ __device__ complex< ValueType > asin(const complex< ValueType > &z)
Definition: complex_quda.h:1048

quda::complex< float >::imag
__host__ __device__ void imag(float im) volatile
Definition: complex_quda.h:526

quda::norm_type
Definition: complex_quda.h:344

quda::sin
__host__ __device__ ValueType sin(ValueType x)
Definition: complex_quda.h:40

quda::acos
__host__ __device__ complex< ValueType > acos(const complex< ValueType > &z)
Definition: complex_quda.h:1041

quda::sin
__host__ __device__ complex< float > sin(const complex< float > &z)
Definition: complex_quda.h:989

quda::operator-
__host__ __device__ complex< ValueType > operator-(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:673

quda::complex< double >::real
__host__ __device__ void real(double re)
Definition: complex_quda.h:628

quda::atan2
__host__ __device__ ValueType atan2(ValueType x, ValueType y)
Definition: complex_quda.h:65

quda::cos
__host__ __device__ complex< float > cos(const complex< float > &z)
Definition: complex_quda.h:892

quda::pow
__host__ __device__ ValueType pow(ValueType x, ExponentType e)
Definition: complex_quda.h:100

quda::complex< double >::imag
__host__ __device__ void imag(double im)
Definition: complex_quda.h:629

quda::complex< float >::imag
__host__ __device__ float imag() const volatile
Definition: complex_quda.h:522

quda::complex::real
__host__ __device__ ValueType real() const volatile

quda::complex< float >::operator/=
__host__ __device__ complex< float > & operator/=(const complex< float > z)
Definition: complex_quda.h:508

quda::exp
__host__ __device__ complex< float > exp(const complex< float > &z)
Definition: complex_quda.h:923

quda::log
__host__ __device__ complex< float > log(const complex< float > &z)
Definition: complex_quda.h:935

quda::complex< double >::operator/=
__host__ __device__ complex< double > & operator/=(const complex< double > z)
Definition: complex_quda.h:609

x
int x[4]
Definition: hisq_paths_force_core.h:99

quda::log10
__host__ __device__ complex< ValueType > log10(const complex< ValueType > &z)
Definition: complex_quda.h:942

quda::complex::operator/=
__host__ __device__ complex< ValueType > & operator/=(const complex< ValueType > z)
Definition: complex_quda.h:415

quda::asinh
__host__ __device__ complex< ValueType > asinh(const complex< ValueType > &z)
Definition: complex_quda.h:1087

quda::complex::operator=
__host__ __device__ complex< ValueType > & operator=(const complex< T > z)
Definition: complex_quda.h:384

quda::log
__host__ __device__ ValueType log(ValueType x)
Definition: complex_quda.h:90

quda::complex< double >::imag
__host__ __device__ double imag() const volatile
Definition: complex_quda.h:623

quda::operator/
__host__ __device__ complex< ValueType > operator/(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:716

quda::complex< float >::operator=
__host__ __device__ volatile complex< float > & operator=(const complex< T > z) volatile
Definition: complex_quda.h:468

quda::log10
__host__ __device__ ValueType log10(ValueType x)
Definition: complex_quda.h:95

quda::operator*
__host__ __device__ complex< ValueType > operator*(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:692

quda::abs
__host__ __device__ double abs(const complex< double > &z)
Definition: complex_quda.h:837

z2
int z2
Definition: llfat_core.h:816

complex::im
float im
Definition: qio_util.h:19

quda::norm_type< complex< T > >::type
T type
Definition: complex_quda.h:349

quda::atan
__host__ __device__ complex< ValueType > atan(const complex< ValueType > &z)
Definition: complex_quda.h:1055

quda::arg
__host__ __device__ ValueType arg(const complex< ValueType > &z)
Returns the phase angle of z.
Definition: complex_quda.h:843

quda::sqrt
__host__ __device__ complex< float > sqrt(const complex< float > &z)
Definition: complex_quda.h:1019

quda::complex< double >::real
__host__ __device__ double real() const
Definition: complex_quda.h:624

quda::complex
Definition: complex_quda.h:119

quda::cos
__host__ __device__ ValueType cos(ValueType x)
Definition: complex_quda.h:35

quda::polar
__host__ __device__ complex< ValueType > polar(const ValueType &m, const ValueType &theta=0)
Returns the complex with magnitude m and angle theta in radians.
Definition: complex_quda.h:865

quda::abs
__host__ __device__ ValueType abs(ValueType x)
Definition: complex_quda.h:110

quda::complex< double >
Definition: complex_quda.h:536

quda::acos
__host__ __device__ ValueType acos(ValueType x)
Definition: complex_quda.h:50

quda::pow
__host__ __device__ complex< float > pow(const float &x, const complex< float > &exponent)
Definition: complex_quda.h:969

quda::conj
__host__ __device__ ValueType conj(ValueType x)
Definition: complex_quda.h:115

quda::operator+
__host__ __device__ complex< ValueType > operator+(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:644

quda::complex< double >::operator*=
__host__ __device__ complex< double > & operator*=(const complex< double > z)
Definition: complex_quda.h:602

quda::complex< double >::value_type
double value_type
Definition: complex_quda.h:539

quda::operator!=
__host__ __device__ bool operator!=(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:802

quda::atanh
__host__ __device__ complex< ValueType > atanh(const complex< ValueType > &z)
Definition: complex_quda.h:1093

quda::complex< float >::operator+=
__host__ __device__ complex< float > & operator+=(const complex< float > z)
Definition: complex_quda.h:485

quda::complex< double >::operator=
__host__ __device__ volatile complex< double > & operator=(const complex< T > z) volatile
Definition: complex_quda.h:569

quda::complex< double >::real
__host__ __device__ double real() const volatile
Definition: complex_quda.h:622

quda::complex< float >::real
__host__ __device__ float real() const volatile
Definition: complex_quda.h:521

quda::acosh
__host__ __device__ complex< ValueType > acosh(const complex< ValueType > &z)
Definition: complex_quda.h:1062

quda::operator==
__host__ __device__ bool operator==(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:777

complex::re
float re
Definition: qio_util.h:18

quda::asin
__host__ __device__ ValueType asin(ValueType x)
Definition: complex_quda.h:55

quda::complex< double >::operator+=
__host__ __device__ complex< double > & operator+=(const complex< double > z)
Definition: complex_quda.h:586