v0.9.0/doc/complex__quda_8h_source.html

 /*
  *  Copyright 2008-2009 NVIDIA Corporation
  *
  *  Licensed under the Apache License, Version 2.0 (the "License");
  *  you may not use this file except in compliance with the License.
  *  You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  *  Unless required by applicable law or agreed to in writing, software
  *  distributed under the License is distributed on an "AS IS" BASIS,
  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  *  See the License for the specific language governing permissions and
  *  limitations under the License.
  */

 #pragma once

 #include <math.h>
 #include <cmath>
 #include <complex>
 #include <sstream>
 #include <cuComplex.h>

 // We need this to make sure code inside quda:: that calls sqrt() using real numbers
 // doesn't try to call the complex sqrt, but the standard sqrt
 namespace quda
 {
   template <typename ValueType>
     __host__ __device__
     inline ValueType cos(ValueType x){
     return std::cos(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType sin(ValueType x){
     return std::sin(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType tan(ValueType x){
     return std::tan(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType acos(ValueType x){
     return std::acos(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType asin(ValueType x){
     return std::asin(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType atan(ValueType x){
     return std::atan(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType atan2(ValueType x,ValueType y){
     return std::atan2(x,y);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType cosh(ValueType x){
     return std::cosh(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType sinh(ValueType x){
     return std::sinh(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType tanh(ValueType x){
     return std::tanh(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType exp(ValueType x){
     return std::exp(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType log(ValueType x){
     return std::log(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType log10(ValueType x){
     return std::log10(x);
   }
   template <typename ValueType, typename ExponentType>
     __host__ __device__
     inline ValueType pow(ValueType x, ExponentType e){
     return std::pow(x,e);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType sqrt(ValueType x){
     return std::sqrt(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType abs(ValueType x){
     return std::abs(x);
   }
   template <typename ValueType>
     __host__ __device__
     inline ValueType conj(ValueType x){
     return x;
   }

   template <typename ValueType> struct complex;
   template <> struct complex<float>;
   template <> struct complex<double>;


   template<typename ValueType>
   __host__ __device__
   ValueType abs(const complex<ValueType>& z);
   template<typename ValueType>
   __host__ __device__
   ValueType arg(const complex<ValueType>& z);
   template<typename ValueType>
   __host__ __device__
   ValueType norm(const complex<ValueType>& z);

   template<typename ValueType>
   __host__ __device__
   complex<ValueType> conj(const complex<ValueType>& z);

   template<typename ValueType>
   __host__ __device__
   complex<ValueType> polar(const ValueType& m, const ValueType& theta = 0);

   // Arithmetic operators:
   // Multiplication
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const complex<ValueType>& rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const ValueType & rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const ValueType& lhs, const complex<ValueType>& rhs);
   // Division
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const complex<ValueType>& rhs);
   template <>
     __host__ __device__
     inline complex<float> operator/(const complex<float>& lhs, const complex<float>& rhs);
   template <>
     __host__ __device__
     inline complex<double> operator/(const complex<double>& lhs, const complex<double>& rhs);

   // Addition
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const complex<ValueType>& rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const ValueType & rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const ValueType& lhs, const complex<ValueType>& rhs);
   // Subtraction
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const complex<ValueType>& rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const ValueType & rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const ValueType& lhs, const complex<ValueType>& rhs);

   // Unary plus and minus
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& rhs);
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& rhs);

   // Transcendentals:
   // Returns the complex cosine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> cos(const complex<ValueType>& z);
   // Returns the complex hyperbolic cosine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> cosh(const complex<ValueType>& z);
   // Returns the complex base e exponential of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> exp(const complex<ValueType>& z);
   // Returns the complex natural logarithm of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> log(const complex<ValueType>& z);
   // Returns the complex base 10 logarithm of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> log10(const complex<ValueType>& z);
   // Returns z to the n'th power.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> pow(const complex<ValueType>& z, const int& n);
   // Returns z to the x'th power.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> pow(const complex<ValueType>&z, const ValueType&x);
   // Returns z to the z2'th power.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> pow(const complex<ValueType>&z, const complex<ValueType>&z2);
   // Returns x to the z'th power.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> pow(const ValueType& x, const complex<ValueType>& z);
   // Returns the complex sine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> sin(const complex<ValueType>&z);
   // Returns the complex hyperbolic sine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> sinh(const complex<ValueType>&z);
   // Returns the complex square root of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> sqrt(const complex<ValueType>&z);
   // Returns the complex tangent of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> tan(const complex<ValueType>&z);
   // Returns the complex hyperbolic tangent of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> tanh(const complex<ValueType>&z);


   // Inverse Trigonometric:
   // Returns the complex arc cosine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> acos(const complex<ValueType>& z);
   // Returns the complex arc sine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> asin(const complex<ValueType>& z);
   // Returns the complex arc tangent of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> atan(const complex<ValueType>& z);
   // Returns the complex hyperbolic arc cosine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> acosh(const complex<ValueType>& z);
   // Returns the complex hyperbolic arc sine of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> asinh(const complex<ValueType>& z);
   // Returns the complex hyperbolic arc tangent of z.
   template <typename ValueType>
     __host__ __device__
   complex<ValueType> atanh(const complex<ValueType>& z);


   // Stream operators:
   template<typename ValueType,class charT, class traits>
     std::basic_ostream<charT, traits>& operator<<(std::basic_ostream<charT, traits>& os, const complex<ValueType>& z);
   template<typename ValueType, typename charT, class traits>
     std::basic_istream<charT, traits>&
     operator>>(std::basic_istream<charT, traits>& is, complex<ValueType>& z);


   // Stream operators
   template<typename ValueType,class charT, class traits>
     std::basic_ostream<charT, traits>& operator<<(std::basic_ostream<charT, traits>& os, const complex<ValueType>& z)
     {
       os << '(' << z.real() << ',' << z.imag() << ')';
       return os;
     };

   template<typename ValueType, typename charT, class traits>
     std::basic_istream<charT, traits>&
     operator>>(std::basic_istream<charT, traits>& is, complex<ValueType>& z)
     {
       ValueType re, im;

       charT ch;
       is >> ch;

       if(ch == '(')
       {
         is >> re >> ch;
         if (ch == ',')
         {
           is >> im >> ch;
           if (ch == ')')
           {
             z = complex<ValueType>(re, im);
           }
           else
           {
             is.setstate(std::ios_base::failbit);
           }
         }
         else if (ch == ')')
         {
           z = re;
         }
         else
         {
           is.setstate(std::ios_base::failbit);
         }
       }
       else
       {
         is.putback(ch);
         is >> re;
         z = re;
       }
       return is;
     }

 template <typename T>
   struct norm_type {
     typedef T type;
   };
  template <typename T>
    struct norm_type< complex<T> > {
    typedef T type;
  };

 template <typename ValueType>
 struct complex
 {
 public:
   typedef ValueType value_type;

   // Constructors
   __host__ __device__
     inline complex<ValueType>(const ValueType & re = ValueType(), const ValueType& im = ValueType())
     {
       real(re);
       imag(im);
     }

   template <class X>
     __host__ __device__
     inline complex<ValueType>(const complex<X> & z)
     {
       real(z.real());
       imag(z.imag());
     }

   template <class X>
     __host__ __device__
     inline complex<ValueType>(const std::complex<X> & z)
     {
       real(z.real());
       imag(z.imag());
     }

   template <typename T>
     __host__ __device__
     inline complex<ValueType>& operator=(const complex<T> z)
     {
       real(z.real());
       imag(z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<ValueType>& operator+=(const complex<ValueType> z)
     {
       real(real()+z.real());
       imag(imag()+z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<ValueType>& operator-=(const complex<ValueType> z)
     {
       real(real()-z.real());
       imag(imag()-z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<ValueType>& operator*=(const complex<ValueType> z)
     {
       *this = *this * z;
       return *this;
     }

   __host__ __device__
     inline complex<ValueType>& operator/=(const complex<ValueType> z)
     {
       *this = *this / z;
       return *this;
     }

   __host__ __device__
     inline complex<ValueType>& operator*=(const ValueType z)
     {
       this->x *= z;
       this->y *= z;
       return *this;
     }

   __host__ __device__ inline ValueType real() const volatile;
   __host__ __device__ inline ValueType imag() const volatile;
   __host__ __device__ inline ValueType real() const;
   __host__ __device__ inline ValueType imag() const;
   __host__ __device__ inline void real(ValueType) volatile;
   __host__ __device__ inline void imag(ValueType) volatile;
   __host__ __device__ inline void real(ValueType);
   __host__ __device__ inline void imag(ValueType);
 };

 // TODO make cuFloatComplex and cuDoubleComplex protected
 // TODO see if returning references is a perf hazard

 template<>
 struct complex <float> : public cuFloatComplex
 {
 public:
   typedef float value_type;
   __host__ __device__
     inline complex<float>(){};
   __host__ __device__
     inline complex<float>(const float & re, const float& im = float())
     {
       real(re);
       imag(im);
     }

   // For some reason having the following constructor
   // explicitly makes things faster with at least g++
   __host__ __device__
     complex<float>(const complex<float> & z)
     : cuFloatComplex(z){}

   __host__ __device__
     complex<float>(cuFloatComplex z)
     : cuFloatComplex(z){}

   template <class X>
     inline complex<float>(const std::complex<X> & z)
     {
       real(z.real());
       imag(z.imag());
     }

   // Member operators
   template <typename T>
     __host__ __device__
     inline volatile complex<float>& operator=(const complex<T> z) volatile
     {
       real(z.real());
       imag(z.imag());
       return *this;
     }

   template <typename T>
     __host__ __device__
     inline complex<float>& operator=(const complex<T> z)
     {
       real(z.real());
       imag(z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<float>& operator+=(const complex<float> z)
     {
       real(real()+z.real());
       imag(imag()+z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<float>& operator-=(const complex<float> z)
     {
       real(real()-z.real());
       imag(imag()-z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<float>& operator*=(const complex<float> z)
     {
       *this = *this * z;
       return *this;
     }

   __host__ __device__
     inline complex<float>& operator/=(const complex<float> z)
     {
       *this = *this / z;
       return *this;
     }

   __host__ __device__
     inline complex<float>& operator*=(const float z)
     {
       this->x *= z;
       this->y *= z;
       return *this;
     }

   // Let the compiler synthesize the copy and assignment operators.
   __host__ __device__ inline complex<float>(const volatile complex<float> & z)
   {
     real(z.real());
     imag(z.imag());
   }

   __host__ __device__ inline float real() const volatile{ return x; }
   __host__ __device__ inline float imag() const volatile{ return y; }
   __host__ __device__ inline float real() const{ return x; }
   __host__ __device__ inline float imag() const{ return y; }
   __host__ __device__ inline void real(float re)volatile{ x = re; }
   __host__ __device__ inline void imag(float im)volatile{ y = im; }
   __host__ __device__ inline void real(float re){ x = re; }
   __host__ __device__ inline void imag(float im){ y = im; }

   // cast operators
   inline operator std::complex<float>() const { return std::complex<float>(real(),imag()); }
   template <typename T>
   inline __host__ __device__ operator complex<T>() const { return complex<T>(static_cast<T>(real()),static_cast<T>(imag())); }
   // inline operator float() const { return real(); }
 };

 template<>
 struct complex <double> : public cuDoubleComplex
 {
 public:
   typedef double value_type;
   __host__ __device__
     inline complex<double>(){};
   __host__ __device__
     inline complex<double>(const double & re, const double& im = double())
     {
       real(re);
       imag(im);
     }

   // For some reason having the following constructor
   // explicitly makes things faster with at least g++
   __host__ __device__
     inline complex<double>(const complex<double> & z)
     : cuDoubleComplex(z) {}

   __host__ __device__
     inline complex<double>(cuDoubleComplex z)
     : cuDoubleComplex(z) {}

   template <class X>
     inline complex<double>(const std::complex<X> & z)
     {
       real(z.real());
       imag(z.imag());
     }

   // Member operators
   template <typename T>
     __host__ __device__
     inline volatile complex<double>& operator=(const complex<T> z) volatile
     {
       real(z.real());
       imag(z.imag());
       return *this;
     }

   template <typename T>
     __host__ __device__
     inline complex<double>& operator=(const complex<T> z)
     {
       real(z.real());
       imag(z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator+=(const complex<double> z)
     {
       real(real()+z.real());
       imag(imag()+z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator+=(const complex<float> z)
     {
       real(real()+z.real());
       imag(imag()+z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator-=(const complex<double> z)
     {
       real(real()-z.real());
       imag(imag()-z.imag());
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator*=(const complex<double> z)
     {
       *this = *this * z;
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator/=(const complex<double> z)
     {
       *this = *this / z;
       return *this;
     }

   __host__ __device__
     inline complex<double>& operator*=(const double z)
     {
       this->x *= z;
       this->y *= z;
       return *this;
     }

   __host__ __device__ inline complex<double>(const volatile complex<double> & z)
   {
     real(z.real());
     imag(z.imag());
   }

   // Let the compiler synthesize the copy and assignment operators.
   __host__ __device__ inline double real() const volatile { return x; }
   __host__ __device__ inline double imag() const volatile { return y; }
   __host__ __device__ inline double real() const { return x; }
   __host__ __device__ inline double imag() const { return y; }
   __host__ __device__ inline void real(double re)volatile{ x = re; }
   __host__ __device__ inline void imag(double im)volatile{ y = im; }
   __host__ __device__ inline void real(double re){ x = re; }
   __host__ __device__ inline void imag(double im){ y = im; }

   // cast operators
   inline operator std::complex<double>() const { return std::complex<double>(real(),imag()); }

   template <typename T>
   inline __host__ __device__ operator complex<T>() const { return complex<T>(static_cast<T>(real()),static_cast<T>(imag())); }
   // inline operator double() { return real(); }
 };

   // Binary arithmetic operations
   // At the moment I'm implementing the basic functions, and the
   // corresponding cuComplex calls are commented.

   template<typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& lhs,
 const complex<ValueType>& rhs){
     return complex<ValueType>(lhs.real()+rhs.real(),lhs.imag()+rhs.imag());
     // return cuCaddf(lhs,rhs);
   }

   template<typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const volatile complex<ValueType>& lhs,
 const volatile complex<ValueType>& rhs){
     return complex<ValueType>(lhs.real()+rhs.real(),lhs.imag()+rhs.imag());
     // return cuCaddf(lhs,rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& lhs, const ValueType & rhs){
     return complex<ValueType>(lhs.real()+rhs,lhs.imag());
     // return cuCaddf(lhs,complex<ValueType>(rhs));
   }
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const ValueType& lhs, const complex<ValueType>& rhs){
     return complex<ValueType>(rhs.real()+lhs,rhs.imag());
     // return cuCaddf(complex<float>(lhs),rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const complex<ValueType>& rhs){
     return complex<ValueType>(lhs.real()-rhs.real(),lhs.imag()-rhs.imag());
     // return cuCsubf(lhs,rhs);
   }
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& lhs, const ValueType & rhs){
     return complex<ValueType>(lhs.real()-rhs,lhs.imag());
     // return cuCsubf(lhs,complex<float>(rhs));
   }
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const ValueType& lhs, const complex<ValueType>& rhs){
     return complex<ValueType>(lhs-rhs.real(),-rhs.imag());
     // return cuCsubf(complex<float>(lhs),rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const complex<ValueType>& lhs,
 const complex<ValueType>& rhs){
     return complex<ValueType>(lhs.real()*rhs.real()-lhs.imag()*rhs.imag(),
 lhs.real()*rhs.imag()+lhs.imag()*rhs.real());
     // return cuCmulf(lhs,rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const complex<ValueType>& lhs, const ValueType & rhs){
     return complex<ValueType>(lhs.real()*rhs,lhs.imag()*rhs);
     // return cuCmulf(lhs,complex<float>(rhs));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator*(const ValueType& lhs, const complex<ValueType>& rhs){
     return complex<ValueType>(rhs.real()*lhs,rhs.imag()*lhs);
     // return cuCmulf(complex<float>(lhs),rhs);
   }


   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const complex<ValueType>& rhs){
     const ValueType cross_norm = lhs.real() * rhs.real() + lhs.imag() * rhs.imag();
     const ValueType rhs_norm = norm(rhs);
     return complex<ValueType>(cross_norm/rhs_norm,
 (lhs.imag() * rhs.real() - lhs.real() * rhs.imag()) / rhs_norm);
   }

   template <>
     __host__ __device__
     inline complex<float> operator/(const complex<float>& lhs, const complex<float>& rhs){
     return cuCdivf(lhs,rhs);
   }

   template <>
     __host__ __device__
     inline complex<double> operator/(const complex<double>& lhs, const complex<double>& rhs){
     return cuCdiv(lhs,rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator/(const complex<ValueType>& lhs, const ValueType & rhs){
     return complex<ValueType>(lhs.real()/rhs,lhs.imag()/rhs);
     // return cuCdivf(lhs,complex<float>(rhs));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator/(const ValueType& lhs, const complex<ValueType>& rhs){
     const ValueType cross_norm = lhs * rhs.real();
     const ValueType rhs_norm = norm(rhs);
     return complex<ValueType>(cross_norm/rhs_norm,(-lhs.real() * rhs.imag()) / rhs_norm);
   }

   template <>
     __host__ __device__
     inline complex<float> operator/(const float& lhs, const complex<float>& rhs){
     return cuCdivf(complex<float>(lhs),rhs);
   }
   template <>
     __host__ __device__
     inline complex<double> operator/(const double& lhs, const complex<double>& rhs){
     return cuCdiv(complex<double>(lhs),rhs);
   }


   // Unary arithmetic operations
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator+(const complex<ValueType>& rhs){
     return rhs;
   }
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> operator-(const complex<ValueType>& rhs){
     return rhs*-ValueType(1);
   }

   // Equality operators
   template <typename ValueType>
     __host__ __device__
     inline bool operator==(const complex<ValueType>& lhs, const complex<ValueType>& rhs){
     if(lhs.real() == rhs.real() && lhs.imag() == rhs.imag()){
       return true;
     }
     return false;
   }

   template <typename ValueType>
     __host__ __device__
     inline bool operator==(const ValueType & lhs, const complex<ValueType>& rhs){
     if(lhs == rhs.real() && rhs.imag() == 0){
       return true;
     }
     return false;
   }
   template <typename ValueType>
     __host__ __device__
     inline bool operator==(const complex<ValueType> & lhs, const ValueType& rhs){
     if(lhs.real() == rhs && lhs.imag() == 0){
       return true;
     }
     return false;
   }


   template <typename ValueType>
     __host__ __device__
     inline bool operator!=(const complex<ValueType>& lhs, const complex<ValueType>& rhs){
     return !(lhs == rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline bool operator!=(const ValueType & lhs, const complex<ValueType>& rhs){
     return !(lhs == rhs);
   }

   template <typename ValueType>
     __host__ __device__
     inline bool operator!=(const complex<ValueType> & lhs, const ValueType& rhs){
     return !(lhs == rhs);
   }


   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> conj(const complex<ValueType>& z){
     return complex<ValueType>(z.real(),-z.imag());
   }

   template <typename ValueType>
     __host__ __device__
     inline ValueType abs(const complex<ValueType>& z){
     return ::hypot(z.real(),z.imag());
   }
   template <>
     __host__ __device__
     inline float abs(const complex<float>& z){
     return ::hypotf(z.real(),z.imag());
   }
   template<>
     __host__ __device__
     inline double abs(const complex<double>& z){
     return ::hypot(z.real(),z.imag());
   }

   template <typename ValueType>
     __host__ __device__
     inline ValueType arg(const complex<ValueType>& z){
     return atan2(z.imag(),z.real());
   }
   template<>
     __host__ __device__
     inline float arg(const complex<float>& z){
     return atan2f(z.imag(),z.real());
   }
   template<>
     __host__ __device__
     inline double arg(const complex<double>& z){
     return atan2(z.imag(),z.real());
   }

   template <typename ValueType>
     __host__ __device__
     inline ValueType norm(const complex<ValueType>& z){
     return z.real()*z.real() + z.imag()*z.imag();
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> polar(const ValueType & m, const ValueType & theta){
     return complex<ValueType>(m * ::cos(theta),m * ::sin(theta));
   }

   template <>
     __host__ __device__
     inline complex<float> polar(const float & magnitude, const float & angle){
     return complex<float>(magnitude * ::cosf(angle),magnitude * ::sinf(angle));
   }

   template <>
     __host__ __device__
     inline complex<double> polar(const double & magnitude, const double & angle){
     return complex<double>(magnitude * ::cos(angle),magnitude * ::sin(angle));
   }

   // Transcendental functions implementation
   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> cos(const complex<ValueType>& z){
     const ValueType re = z.real();
     const ValueType im = z.imag();
     return complex<ValueType>(::cos(re) * ::cosh(im), -::sin(re) * ::sinh(im));
   }

   template <>
     __host__ __device__
     inline complex<float> cos(const complex<float>& z){
     const float re = z.real();
     const float im = z.imag();
     return complex<float>(cosf(re) * coshf(im), -sinf(re) * sinhf(im));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> cosh(const complex<ValueType>& z){
     const ValueType re = z.real();
     const ValueType im = z.imag();
     return complex<ValueType>(::cosh(re) * ::cos(im), ::sinh(re) * ::sin(im));
   }

   template <>
     __host__ __device__
     inline complex<float> cosh(const complex<float>& z){
     const float re = z.real();
     const float im = z.imag();
     return complex<float>(::coshf(re) * ::cosf(im), ::sinhf(re) * ::sinf(im));
   }


   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> exp(const complex<ValueType>& z){
     return polar(::exp(z.real()),z.imag());
   }

   template <>
     __host__ __device__
     inline complex<float> exp(const complex<float>& z){
     return polar(::expf(z.real()),z.imag());
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> log(const complex<ValueType>& z){
     return complex<ValueType>(::log(abs(z)),arg(z));
   }

   template <>
     __host__ __device__
     inline complex<float> log(const complex<float>& z){
     return complex<float>(::logf(abs(z)),arg(z));
   }


   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> log10(const complex<ValueType>& z){
     // Using the explicit literal prevents compile time warnings in
     // devices that don't support doubles
     return log(z)/ValueType(2.30258509299404568402);
     // return log(z)/ValueType(::log(10.0));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> pow(const complex<ValueType>& z, const ValueType & exponent){
     return exp(log(z)*exponent);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> pow(const complex<ValueType>& z, const complex<ValueType> & exponent){
     return exp(log(z)*exponent);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> pow(const ValueType & x, const complex<ValueType> & exponent){
     return exp(::log(x)*exponent);
   }

   template <>
     __host__ __device__
     inline complex<float> pow(const float & x, const complex<float> & exponent){
     return exp(::logf(x)*exponent);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> pow(const complex<ValueType>& z,const int & exponent){
     return exp(log(z)*ValueType(exponent));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> sin(const complex<ValueType>& z){
     const ValueType re = z.real();
     const ValueType im = z.imag();
     return complex<ValueType>(::sin(re) * ::cosh(im), ::cos(re) * ::sinh(im));
   }

   template <>
     __host__ __device__
     inline complex<float> sin(const complex<float>& z){
     const float re = z.real();
     const float im = z.imag();
     return complex<float>(::sinf(re) * ::coshf(im), ::cosf(re) * ::sinhf(im));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> sinh(const complex<ValueType>& z){
     const ValueType re = z.real();
     const ValueType im = z.imag();
     return complex<ValueType>(::sinh(re) * ::cos(im), ::cosh(re) * ::sin(im));
   }

   template <>
     __host__ __device__
     inline complex<float> sinh(const complex<float>& z){
     const float re = z.real();
     const float im = z.imag();
     return complex<float>(::sinhf(re) * ::cosf(im), ::coshf(re) * ::sinf(im));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> sqrt(const complex<ValueType>& z){
     return polar(::sqrt(abs(z)),arg(z)/ValueType(2));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<float> sqrt(const complex<float>& z){
     return polar(::sqrtf(abs(z)),arg(z)/float(2));
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> tan(const complex<ValueType>& z){
     return sin(z)/cos(z);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> tanh(const complex<ValueType>& z){
     // This implementation seems better than the simple sin/cos
     return (exp(ValueType(2)*z)-ValueType(1))/(exp(ValueType(2)*z)+ValueType(1));
     // return sinh(z)/cosh(z);
   }

   // Inverse trigonometric functions implementation

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> acos(const complex<ValueType>& z){
     const complex<ValueType> ret = asin(z);
     return complex<ValueType>(ValueType(M_PI/2.0) - ret.real(),-ret.imag());
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> asin(const complex<ValueType>& z){
     const complex<ValueType> i(0,1);
     return -i*asinh(i*z);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> atan(const complex<ValueType>& z){
     const complex<ValueType> i(0,1);
     return -i*atanh(i*z);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> acosh(const complex<ValueType>& z){
     quda::complex<ValueType> ret((z.real() - z.imag()) * (z.real() + z.imag()) - ValueType(1.0),
          ValueType(2.0) * z.real() * z.imag());
     ret = sqrt(ret);
     if (z.real() < ValueType(0.0)){
       ret = -ret;
     }
     ret += z;
     ret = log(ret);
     if (ret.real() < ValueType(0.0)){
       ret = -ret;
     }
     return ret;

     /*
       quda::complex<ValueType> ret = log(sqrt(z*z-ValueType(1))+z);
       if(ret.real() < 0){
       ret.real(-ret.real());
       }
       return ret;
     */
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> asinh(const complex<ValueType>& z){
     return log(sqrt(z*z+ValueType(1))+z);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<ValueType> atanh(const complex<ValueType>& z){
     ValueType imag2 = z.imag() * z.imag();
     ValueType n = ValueType(1.0) + z.real();
     n = imag2 + n * n;

     ValueType d = ValueType(1.0) - z.real();
     d = imag2 + d * d;
     complex<ValueType> ret(ValueType(0.25) * (::log(n) - ::log(d)),0);

     d = ValueType(1.0) - z.real() * z.real() - imag2;

     ret.imag(ValueType(0.5) * ::atan2(ValueType(2.0) * z.imag(), d));
     return ret;
     //return (log(ValueType(1)+z)-log(ValueType(1)-z))/ValueType(2);
   }

   template <typename ValueType>
     __host__ __device__
     inline complex<float> atanh(const complex<float>& z){
     float imag2 = z.imag() * z.imag();
     float n = float(1.0) + z.real();
     n = imag2 + n * n;

     float d = float(1.0) - z.real();
     d = imag2 + d * d;
     complex<float> ret(float(0.25) * (::logf(n) - ::logf(d)),0);

     d = float(1.0) - z.real() * z.real() - imag2;

     ret.imag(float(0.5) * ::atan2f(float(2.0) * z.imag(), d));
     return ret;
     //return (log(ValueType(1)+z)-log(ValueType(1)-z))/ValueType(2);

   }

 } // end namespace quda
quda::sinh
__host__ __device__ complex< float > sinh(const complex< float > &z)
Definition: complex_quda.h:1042

quda::tanh
__host__ __device__ ValueType tanh(ValueType x)
Definition: complex_quda.h:80

cosf
float cosf(float)

quda::sinh
__host__ __device__ ValueType sinh(ValueType x)
Definition: complex_quda.h:75

quda::complex< float >::operator-=
__host__ __device__ complex< float > & operator-=(const complex< float > z)
Definition: complex_quda.h:501

quda::complex< double >::operator=
__host__ __device__ complex< double > & operator=(const complex< T > z)
Definition: complex_quda.h:596

quda::complex::value_type
ValueType value_type
Definition: complex_quda.h:356

quda::norm
__host__ __device__ ValueType norm(const complex< ValueType > &z)
Returns the magnitude of z squared.
Definition: complex_quda.h:896

quda::complex< double >::operator+=
__host__ __device__ complex< double > & operator+=(const complex< float > z)
Definition: complex_quda.h:612

quda::atan
__host__ __device__ ValueType atan(ValueType x)
Definition: complex_quda.h:60

quda::complex< double >::operator-=
__host__ __device__ complex< double > & operator-=(const complex< double > z)
Definition: complex_quda.h:620

quda::exp
__host__ __device__ ValueType exp(ValueType x)
Definition: complex_quda.h:85

quda::complex< float >::operator*=
__host__ __device__ complex< float > & operator*=(const complex< float > z)
Definition: complex_quda.h:509

quda::cosh
__host__ __device__ ValueType cosh(ValueType x)
Definition: complex_quda.h:70

quda::complex< double >::real
__host__ __device__ void real(double re) volatile
Definition: complex_quda.h:660

quda::sqrt
__host__ __device__ ValueType sqrt(ValueType x)
Definition: complex_quda.h:105

quda::cosh
__host__ __device__ complex< float > cosh(const complex< float > &z)
Definition: complex_quda.h:945

quda::complex< float >::real
__host__ __device__ void real(float re)
Definition: complex_quda.h:543

coshf
float coshf(float)

quda::complex::imag
__host__ __device__ ValueType imag() const volatile

quda::tanh
__host__ __device__ complex< ValueType > tanh(const complex< ValueType > &z)
Definition: complex_quda.h:1068

quda::complex< float >::imag
__host__ __device__ void imag(float im)
Definition: complex_quda.h:544

z
int int z
Definition: CMakeCUDACompilerId.cpp1.ii:2637

quda::complex< float >
Definition: complex_quda.h:443

quda::operator>>
std::basic_istream< charT, traits > & operator>>(std::basic_istream< charT, traits > &is, complex< ValueType > &z)
Definition: complex_quda.h:303

quda::complex< double >::imag
__host__ __device__ double imag() const
Definition: complex_quda.h:659

quda::tan
__host__ __device__ ValueType tan(ValueType x)
Definition: complex_quda.h:45

ret
return ret
Definition: CMakeCUDACompilerId.cpp1.ii:13161

quda::complex< double >::imag
__host__ __device__ void imag(double im) volatile
Definition: complex_quda.h:661

quda
Definition: blas_cublas.h:6

quda::complex::operator+=
__host__ __device__ complex< ValueType > & operator+=(const complex< ValueType > z)
Definition: complex_quda.h:392

quda::complex< float >::real
__host__ __device__ void real(float re) volatile
Definition: complex_quda.h:541

quda::complex< float >::operator=
__host__ __device__ complex< float > & operator=(const complex< T > z)
Definition: complex_quda.h:485

quda::complex< float >::value_type
float value_type
Definition: complex_quda.h:446

quda::tan
__host__ __device__ complex< ValueType > tan(const complex< ValueType > &z)
Definition: complex_quda.h:1062

quda::norm_type::type
T type
Definition: complex_quda.h:345

x
p x
Definition: CMakeCUDACompilerId.cpp1.ii:3011

quda::complex::operator-=
__host__ __device__ complex< ValueType > & operator-=(const complex< ValueType > z)
Definition: complex_quda.h:400

quda::complex::operator*=
__host__ __device__ complex< ValueType > & operator*=(const complex< ValueType > z)
Definition: complex_quda.h:408

quda::asin
__host__ __device__ complex< ValueType > asin(const complex< ValueType > &z)
Definition: complex_quda.h:1085

quda::complex< float >::imag
__host__ __device__ void imag(float im) volatile
Definition: complex_quda.h:542

quda::norm_type
Definition: complex_quda.h:344

quda::sin
__host__ __device__ ValueType sin(ValueType x)
Definition: complex_quda.h:40

quda::acos
__host__ __device__ complex< ValueType > acos(const complex< ValueType > &z)
Definition: complex_quda.h:1078

atan2f
float atan2f(float, float)

quda::sin
__host__ __device__ complex< float > sin(const complex< float > &z)
Definition: complex_quda.h:1026

quda::complex< double >::real
__host__ __device__ void real(double re)
Definition: complex_quda.h:662

quda::atan2
__host__ __device__ ValueType atan2(ValueType x, ValueType y)
Definition: complex_quda.h:65

quda::operator-
__device__ __host__ ColorSpinor< Float, Nc, Ns > operator-(const ColorSpinor< Float, Nc, Ns > &x, const ColorSpinor< Float, Nc, Ns > &y)
ColorSpinor subtraction operator.
Definition: color_spinor.h:907

fused_exterior_ndeg_tm_dslash_cuda_gen.i
int i
start here
Definition: fused_exterior_ndeg_tm_dslash_cuda_gen.py:816

double
double
Definition: CMakeCUDACompilerId.cpp1.ii:8010

quda::cos
__host__ __device__ complex< float > cos(const complex< float > &z)
Definition: complex_quda.h:929

quda::pow
__host__ __device__ ValueType pow(ValueType x, ExponentType e)
Definition: complex_quda.h:100

quda::complex< double >::imag
__host__ __device__ void imag(double im)
Definition: complex_quda.h:663

quda::complex< float >::imag
__host__ __device__ float imag() const volatile
Definition: complex_quda.h:538

quda::complex::real
__host__ __device__ ValueType real() const volatile

quda::complex< float >::operator/=
__host__ __device__ complex< float > & operator/=(const complex< float > z)
Definition: complex_quda.h:516

quda::complex< float >::real
__host__ __device__ float real() const
Definition: complex_quda.h:539

quda::exp
__host__ __device__ complex< float > exp(const complex< float > &z)
Definition: complex_quda.h:960

sinhf
float sinhf(float)

quda::log
__host__ __device__ complex< float > log(const complex< float > &z)
Definition: complex_quda.h:972

quda::complex< double >::operator/=
__host__ __device__ complex< double > & operator/=(const complex< double > z)
Definition: complex_quda.h:635

quda::log10
__host__ __device__ complex< ValueType > log10(const complex< ValueType > &z)
Definition: complex_quda.h:979

quda::complex::operator/=
__host__ __device__ complex< ValueType > & operator/=(const complex< ValueType > z)
Definition: complex_quda.h:415

quda::asinh
__host__ __device__ complex< ValueType > asinh(const complex< ValueType > &z)
Definition: complex_quda.h:1124

quda::complex::operator*=
__host__ __device__ complex< ValueType > & operator*=(const ValueType z)
Definition: complex_quda.h:422

quda::complex::operator=
__host__ __device__ complex< ValueType > & operator=(const complex< T > z)
Definition: complex_quda.h:384

quda::log
__host__ __device__ ValueType log(ValueType x)
Definition: complex_quda.h:90

quda::complex< double >::imag
__host__ __device__ double imag() const volatile
Definition: complex_quda.h:657

quda::complex< float >::operator*=
__host__ __device__ complex< float > & operator*=(const float z)
Definition: complex_quda.h:523

quda::operator/
__host__ __device__ complex< ValueType > operator/(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:751

quda::complex< float >::operator=
__host__ __device__ volatile complex< float > & operator=(const complex< T > z) volatile
Definition: complex_quda.h:476

logf
float logf(float)

quda::log10
__host__ __device__ ValueType log10(ValueType x)
Definition: complex_quda.h:95

hypot
double hypot(double, double)

quda::abs
__host__ __device__ double abs(const complex< double > &z)
Definition: complex_quda.h:874

quda::operator+
__device__ __host__ ColorSpinor< Float, Nc, Ns > operator+(const ColorSpinor< Float, Nc, Ns > &x, const ColorSpinor< Float, Nc, Ns > &y)
ColorSpinor addition operator.
Definition: color_spinor.h:885

n
int n
Definition: CMakeCUDACompilerId.cpp1.ii:8086

sinf
float sinf(float)

quda::complex< double >::operator*=
__host__ __device__ complex< double > & operator*=(const double z)
Definition: complex_quda.h:642

expf
float expf(float)

e
return e
Definition: CMakeCUDACompilerId.cpp1.ii:3026

quda::norm_type< complex< T > >::type
T type
Definition: complex_quda.h:349

quda::atan
__host__ __device__ complex< ValueType > atan(const complex< ValueType > &z)
Definition: complex_quda.h:1092

quda::arg
__host__ __device__ ValueType arg(const complex< ValueType > &z)
Returns the phase angle of z.
Definition: complex_quda.h:880

quda::sqrt
__host__ __device__ complex< float > sqrt(const complex< float > &z)
Definition: complex_quda.h:1056

quda::complex< double >::real
__host__ __device__ double real() const
Definition: complex_quda.h:658

quda::cos
__host__ __device__ ValueType cos(ValueType x)
Definition: complex_quda.h:35

quda::polar
__host__ __device__ complex< ValueType > polar(const ValueType &m, const ValueType &theta=0)
Returns the complex with magnitude m and angle theta in radians.
Definition: complex_quda.h:902

quda::abs
__host__ __device__ ValueType abs(ValueType x)
Definition: complex_quda.h:110

quda::operator*
__device__ __host__ ColorSpinor< Float, Nc, Ns > operator*(const S &a, const ColorSpinor< Float, Nc, Ns > &x)
Compute the scalar-vector product y = a * x.
Definition: color_spinor.h:929

quda::complex< double >
Definition: complex_quda.h:554

quda::acos
__host__ __device__ ValueType acos(ValueType x)
Definition: complex_quda.h:50

float
float
Definition: CMakeCUDACompilerId.cpp1.ii:12791

quda::pow
__host__ __device__ complex< float > pow(const float &x, const complex< float > &exponent)
Definition: complex_quda.h:1006

quda::conj
__host__ __device__ ValueType conj(ValueType x)
Definition: complex_quda.h:115

sqrtf
float sqrtf(float)

quda::complex< double >::operator*=
__host__ __device__ complex< double > & operator*=(const complex< double > z)
Definition: complex_quda.h:628

d
static __inline__ size_t size_t d
Definition: CMakeCUDACompilerId.cpp1.ii:3019

hypotf
float hypotf(float, float)

quda::complex< double >::value_type
double value_type
Definition: complex_quda.h:557

quda::operator!=
__host__ __device__ bool operator!=(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:839

quda::atanh
__host__ __device__ complex< ValueType > atanh(const complex< ValueType > &z)
Definition: complex_quda.h:1130

quda::complex< float >::imag
__host__ __device__ float imag() const
Definition: complex_quda.h:540

quda::complex< float >::operator+=
__host__ __device__ complex< float > & operator+=(const complex< float > z)
Definition: complex_quda.h:493

quda::complex< double >::operator=
__host__ __device__ volatile complex< double > & operator=(const complex< T > z) volatile
Definition: complex_quda.h:587

quda::complex< double >::real
__host__ __device__ double real() const volatile
Definition: complex_quda.h:656

quda::complex< float >::real
__host__ __device__ float real() const volatile
Definition: complex_quda.h:537

quda::acosh
__host__ __device__ complex< ValueType > acosh(const complex< ValueType > &z)
Definition: complex_quda.h:1099

quda::operator==
__host__ __device__ bool operator==(const complex< ValueType > &lhs, const complex< ValueType > &rhs)
Definition: complex_quda.h:812

y
int y
Definition: CMakeCUDACompilerId.cpp1.ii:2637

quda::asin
__host__ __device__ ValueType asin(ValueType x)
Definition: complex_quda.h:55

quda::complex< double >::operator+=
__host__ __device__ complex< double > & operator+=(const complex< double > z)
Definition: complex_quda.h:604