v0.9.0/doc/svd__quda_8h_source.html

 #include <float.h>
 #include <math.h>

 #ifndef _SVD_QUDA_H_
 #define _SVD_QUDA_H_

 // Function qualifier: marks a function as callable from both device and host code.
 #define DEVICEHOST __device__ __host__
 // Relative tolerance used by bdSVD when deciding that a super-diagonal
 // entry of the bidiagonal matrix is small enough to be set to zero.
 #define SVDPREC 1e-11
 // Natural logarithm of 2 (subtracted in log-space inside smallSVD).
 #define LOG2 0.69314718055994530942
 // Sentinel value: the most negative finite double.  It is #undef'd again
 // at the end of this header.
 #define INVALID_DOUBLE (-DBL_MAX)


 //namespace quda{

 // Magnitude sqrt(z.x*z.x + z.y*z.y) of a complex-like value that exposes
 // its two components as the members `x` and `y`.
 //
 // The result has the (reference-stripped) type of Cmplx::x.  The work is
 // delegated to hypot(), which avoids intermediate overflow/underflow just
 // like the previous hand-written scaling did, but additionally
 //   - never evaluates 0/0 for a zero input,
 //   - returns +inf (instead of NaN) when both components are infinite,
 //   - stays in the precision of `real` instead of promoting to double.
 template<class Cmplx>
 inline DEVICEHOST
 typename std::remove_reference<decltype(Cmplx::x)>::type cabs(const Cmplx & z)
 {
   typedef typename std::remove_reference<decltype(Cmplx::x)>::type real;
   const real re = z.x;
   const real im = z.y;
   return hypot(re, im);
 }


 // Returns sqrt(a*a + b*b), evaluated in the promoted type of T and U.
 //
 // Both arguments are first converted to PromoteTypeId<T,U>::Type and the
 // result is computed with hypot(), which is safe against intermediate
 // overflow/underflow.  Compared with the previous hand-written scaling this
 // no longer evaluates 0/0 when both inputs are zero and returns +inf rather
 // than NaN when both inputs are infinite.
 template<class T, class U>
 inline DEVICEHOST typename PromoteTypeId<T,U>::Type quadSum(const T & a, const U & b){
   typedef typename PromoteTypeId<T,U>::Type Promoted;
   const Promoted pa = a;
   const Promoted pb = b;
   return hypot(pa, pb);
 }


 // Shared implementation of getNorm: sqrt(|a[0]|^2 + |a[1]|^2 + |a[2]|^2),
 // accumulated pairwise through cabs() and quadSum().
 template<class Float>
 DEVICEHOST
 inline Float getNormImpl(const Array<complex<Float>,3>& a){
   const Float abs0 = cabs(a[0]);
   const Float abs1 = cabs(a[1]);
   const Float partial = quadSum(abs0, abs1);
   const Float abs2 = cabs(a[2]);
   return quadSum(abs2, partial);
 }


 // Norm of a 3-component single-precision complex vector.
 DEVICEHOST
 inline float getNorm(const Array<complex<float>,3>& a){
   return getNormImpl<float>(a);
 }


 // Norm of a 3-component double-precision complex vector.
 DEVICEHOST
 inline double getNorm(const Array<complex<double>,3>& a){
   return getNormImpl<double>(a);
 }


 // Builds the 3x3 matrix  hh = 1 - conj(tau) * outerProd(v, v).
 //   tau : scalar factor (its conjugate multiplies the outer product)
 //   v   : vector passed twice to outerProd()
 //   hh  : output, overwritten with the result
 template<class T>
 inline DEVICEHOST
 void constructHHMat(const T & tau, const Array<T,3> & v, Matrix<T,3> & hh)
 {
   Matrix<T,3> outer;
   outerProd(v, v, &outer);

   Matrix<T,3> unit;
   setIdentity(&unit);

   hh = unit - conj(tau)*outer;
 }


 // Computes the shift used by the QR iteration in bdSVD.
 //
 // With
 //   m11 = b(1,1)^2 + b(0,1)^2,  m22 = b(2,2)^2 + b(1,2)^2,  m12 = b(1,1)*b(1,2)
 // the result is the eigenvalue of the symmetric 2x2 matrix
 // [[m11, m12], [m12, m22]] that lies closest to m22, written in a form
 // that avoids cancellation:  m22 -/+ m12^2 / (sqrt(dm^2 + m12^2) +/- dm),
 // where dm = (m11 - m22)/2.
 //
 //   b          : input matrix (only b(0,1), b(1,1), b(1,2), b(2,2) are read)
 //   lambda_max : output, overwritten with the shift
 //
 // When dm == 0 and m12 == 0 the correction term would be 0/0; in that case
 // the 2x2 matrix is already diagonal and m22 itself is returned.
 template<class Real>
 inline DEVICEHOST
 void getLambdaMax(const Matrix<Real,3> & b, Real & lambda_max){

   const Real m11 = b(1,1)*b(1,1) + b(0,1)*b(0,1);
   const Real m22 = b(2,2)*b(2,2) + b(1,2)*b(1,2);
   const Real m12 = b(1,1)*b(1,2);
   const Real dm  = (m11 - m22) * 0.5;

   const Real norm1 = quadSum(dm, m12);
   if( dm >= 0.0 ){
     // norm1 + dm vanishes only if dm == 0 and m12 == 0.
     const Real denom = norm1 + dm;
     lambda_max = (denom != 0.0) ? m22 - (m12*m12)/denom : m22;
   }else{
     // dm < 0 here, so norm1 - dm is strictly positive.
     lambda_max = m22 + (m12*m12)/(norm1 - dm);
   }
   return;
 }


 // Computes a rotation (c, s) with c*c + s*s = 1 and c*beta + s*alpha = 0.
 //   alpha, beta : the two entries the rotation is built from
 //   c, s        : outputs
 // For beta == 0 the identity rotation (c = 1, s = 0) is returned.  Otherwise
 // the ratio is always formed with the larger magnitude in the denominator.
 template<class Real>
 inline DEVICEHOST
 void getGivensRotation(const Real & alpha, const Real & beta, Real & c, Real & s)
 {
   // Nothing to rotate away.
   if( beta == 0.0 ){
     c = 1.0;
     s = 0.0;
     return;
   }

   // |beta| dominates: derive s first, then c from it.
   if( fabs(beta) > fabs(alpha) ){
     const Real t = -alpha/beta;
     s = rsqrt(1.0 + t*t);
     c = t*s;
     return;
   }

   // |alpha| dominates (or ties): derive c first, then s from it.
   const Real t = -beta/alpha;
   c = rsqrt(1.0 + t*t);
   s = t*c;
 }

 // Applies the rotation (c, s) in place to columns `index` and `index+1`
 // of the 3x3 matrix m, one row at a time:
 //   m(i,index)   <- m(i,index)*c - m(i,index+1)*s
 //   m(i,index+1) <- m(i,index)*s + m(i,index+1)*c   (using the old values)
 template<class Real>
 inline DEVICEHOST
 void accumGivensRotation(int index, const Real & c, const Real & s, Matrix<Real,3> & m){
   const int next = index+1;
   for(int row=0; row<3; ++row){
     const Real left  = m(row,index);
     const Real right = m(row,next);
     m(row,index) = left*c - right*s;
     m(row,next)  = left*s + right*c;
   }
 }

 // Overwrites the 2x2 matrix m with the rotation
 //   [  c  s ]
 //   [ -s  c ]
 template<class Real>
 inline DEVICEHOST
 void assignGivensRotation(const Real & c, const Real & s, Matrix<Real,2> & m){
   // first row
   m(0,0) = c;
   m(0,1) = s;
   // second row
   m(1,0) = -s;
   m(1,1) = c;
 }

 // Exchanges the values of a and b.
 template<class Real>
 inline DEVICEHOST
 void swap(Real & a, Real & b){
   const Real saved = b;
   b = a;
   a = saved;
 }

 // Diagonalises a 2x2 matrix using rotations on the left (u) and right (v).
 //
 //   u, v : outputs; first reset to the identity, then overwritten with a
 //          rotation (or, for v in the first branch, a column exchange)
 //   m    : in/out; m(0,0), m(0,1) and m(1,1) are read and overwritten so
 //          that m(0,1) ends up zero.  m(1,0) is never read or written here,
 //          i.e. the input is treated as upper triangular.
 //
 // Four cases are distinguished:
 //   1. m(0,0) == 0
 //   2. m(1,1) == 0
 //   3. m(0,1) != 0 (general case)
 //   4. otherwise (m(0,1) == 0 with non-zero diagonal): m is already diagonal
 //      and nothing besides resetting u and v is done.
 template<class Real>
 inline DEVICEHOST
 void smallSVD(Matrix<Real,2> & u, Matrix<Real,2> & v, Matrix<Real,2> & m){
   // set u and v to the 2x2 identity matrix
   setIdentity(&u);
   setIdentity(&v);

   Real c, s;

   if( m(0,0) == 0.0 ){

     // Only the second column is non-zero: rotate it onto its first entry.
     getGivensRotation(m(0,1), m(1,1), c, s);

     // The rotated value is stored in m(0,0); everything else is cleared.
     m(0,0) = m(0,1)*c - m(1,1)*s;
     m(0,1) = 0.0;
     m(1,1) = 0.0;

     // exchange columns in v
     v(0,0) = 0.0;
     v(0,1) = 1.0;
     v(1,0) = 1.0;
     v(1,1) = 0.0;

     // u is a Givens rotation
     assignGivensRotation(c, s, u);

   }else if( m(1,1) == 0.0 ){

     // Only the first row is non-zero: rotate it onto its first entry.
     getGivensRotation(m(0,0), m(0,1), c, s);

     m(0,0) = m(0,0)*c - m(0,1)*s;
     m(0,1) = 0.0;
     m(1,1) = 0.0;

     // v is a Givens rotation; u stays the identity
     assignGivensRotation(c,s,v);

   }else if( m(0,1) != 0.0 ){

     // need to calculate (m(1,1)**2 + m(0,1)**2 - m(0,0)**2)/(2*m(0,0)*m(0,1))
     // The quotient is assembled from logarithms of the magnitudes; the signs
     // are tracked separately and restored further below.
     Real abs01 = fabs(m(0,1));
     Real abs11 = fabs(m(1,1));
     Real min, max;
     if( abs01 > abs11 ){ min = abs11; max = abs01; }
     else { min = abs01; max = abs11; }


     Real ratio = min/max;
     // alpha = log( m(0,1)**2 + m(1,1)**2 )
     Real alpha = 2.0*log(max) + log(1.0 + ratio*ratio);

     Real abs00 = fabs(m(0,0));
     // beta = log( m(0,0)**2 )
     Real beta = 2.0*log(abs00);

     int sign;
     Real temp;

     // temp = log| exp(alpha) - exp(beta) |, factoring out the larger term;
     // sign records the sign of exp(alpha) - exp(beta).
     if( alpha > beta ){
       sign = 1;
       temp = alpha + log(1.0 - exp(beta-alpha));
     }else{
       sign = -1;
       temp = beta + log(1.0 - exp(alpha-beta));
     }
     // Divide by 2*|m(0,0)|*|m(0,1)| in log-space, then leave log-space.
     temp -= LOG2 + log(abs00) + log(abs01);
     temp = sign*exp(temp);

     // Restore the sign of the denominator m(0,0)*m(0,1).
     if( m(0,0) < 0.0 ){ temp *= -1.0; }
     if( m(0,1) < 0.0 ){ temp *= -1.0; }

     // beta = sqrt(1 + temp**2) carrying the sign of temp, so that
     // temp + beta below does not cancel.
     beta = (temp >= 0.0) ? quadSum(1.0, temp) : -quadSum(1.0, temp);
     temp = 1.0/(temp + beta);

     // Calculate beta = sqrt(1 + temp**2)
     beta = quadSum(1.0, temp);

     // Rotation with s/c = temp
     c = 1.0/beta;
     s = temp*c;

     // p = m with the rotation (c, s) applied from the right
     Matrix<Real,2> p;

     p(0,0) = c*m(0,0) - s*m(0,1);
     p(1,0) =          - s*m(1,1);
     p(0,1) = s*m(0,0) + c*m(0,1);
     p(1,1) = c*m(1,1);

     assignGivensRotation(c, s, v);

     // Make the column with the largest norm the first column
     alpha = quadSum(p(0,0),p(1,0));
     beta  = quadSum(p(0,1),p(1,1));

     if(alpha < beta){
       swap(p(0,0),p(0,1));
       swap(p(1,0),p(1,1));

       // keep v consistent with the column exchange in p
       swap(v(0,0),v(0,1));
       swap(v(1,0),v(1,1));
     }

     // Left rotation built from the first column of p
     getGivensRotation(p(0,0), p(1,0), c, s);

     // Only the diagonal of the result is stored; m(0,1) is set to zero.
     m(0,0) = p(0,0)*c - s*p(1,0);
     m(1,1) = p(0,1)*s + c*p(1,1);
     m(0,1) = 0.0;

     assignGivensRotation(c,s,u);
   }

   return;
 }

 // Change this so that the bidiagonal terms are not returned
 // as a complex matrix
 //
 // Computes unitary matrices u and v from a sequence of up to five
 // reflections / phase rotations applied alternately from the left and from
 // the right of `mat`.  The caller (computeSVD) then forms conj(u)*mat*v and
 // keeps only its real part.
 //
 //   mat : input 3x3 complex matrix (not modified)
 //   u   : output, product of the left transformations
 //   v   : output, product of the right transformations
 //
 // Every step is skipped when the entries it would eliminate are already
 // zero (and the pivot is already real).  u and v are set to the identity
 // whenever their first reflector is skipped, so that the later
 // `u = u*temp` / `v = v*temp` updates always act on a well-defined matrix
 // and an input that needs no transformation at all yields u = v = 1.
 template<class Float>
   DEVICEHOST
 void getRealBidiagMatrix(const Matrix<complex<Float>,3> &mat, Matrix<complex<Float>,3> &u, Matrix<complex<Float>,3> &v)
 {
   typedef complex<Float> Complex;

   Matrix<Complex,3> p;
   Array<Complex,3> vec;
   Matrix<Complex,3> temp;


   const Complex COMPLEX_UNITY(1.0,0.0);
   const Complex COMPLEX_ZERO = 0.0;
   // Step 1: build the first left reflector v,
   //        calculate the first left rotation
   //        apply to the original matrix
   Float x = cabs(mat(1,0));
   Float y = cabs(mat(2,0));
   Float norm1 = quadSum(x,y);
   Float beta;
   Complex w, tau, z;

   if(norm1 == 0 && mat(0,0).y == 0){
     // First column is already (real, 0, 0): no left reflector needed.
     p = mat;
     setIdentity(&u);
   }else{
     Array<Complex,3> temp_vec;
     copyColumn(mat, 0, &temp_vec);

     // beta gets the sign opposite to Re(mat(0,0)) to avoid cancellation in w
     beta = (mat(0,0).x > 0.0) ? -getNorm(temp_vec) : getNorm(temp_vec);

     w.x = mat(0,0).x - beta; // work around for LLVM
     w.y = mat(0,0).y;
     Float norm1_inv = 1.0/cabs(w);
     w = conj(w)*norm1_inv;

     // Assign the vector elements
     vec[0] = COMPLEX_UNITY;
     vec[1] = mat(1,0)*w*norm1_inv;
     vec[2] = mat(2,0)*w*norm1_inv;

     // Now compute tau
     tau.x =  (beta - mat(0,0).x)/beta;
     tau.y =  mat(0,0).y/beta;
     // construct the Householder matrix
     constructHHMat(tau, vec, temp);
     p = conj(temp)*mat;
     u = temp;
   }

   // Step 2: build the first right reflector
   Float norm2 = cabs(p(0,2));
   if(norm2 != 0.0 || p(0,1).y != 0.0){
     norm1 = cabs(p(0,1));
     beta  = (p(0,1).x > 0.0) ? -quadSum(norm1,norm2) : quadSum(norm1,norm2);
     vec[0] = COMPLEX_ZERO;
     vec[1] = COMPLEX_UNITY;

     w.x = p(0,1).x-beta; // work around for LLVM
     w.y = p(0,1).y;
     Float norm1_inv = 1.0/cabs(w);
     w = conj(w)*norm1_inv;
     z = conj(p(0,2))*norm1_inv;
     vec[2] = z*conj(w);

     tau.x = (beta - p(0,1).x)/beta; // work around for LLVM
     tau.y = (- p(0,1).y)/beta;
     // construct the Householder matrix
     constructHHMat(tau, vec, temp);
     p = p*temp;
     v = temp;
   }else{
     // First row is already (*, real, 0): no right reflector needed.
     setIdentity(&v);
   }

   // Step 3: build the second left reflector
   norm2 = cabs(p(2,1));
   if(norm2 != 0.0 || p(1,1).y != 0.0){
     norm1 = cabs(p(1,1));
     beta  = (p(1,1).x > 0) ? -quadSum(norm1,norm2) : quadSum(norm1,norm2);

     // Set the first two elements of the vector
     vec[0] = COMPLEX_ZERO;
     vec[1] = COMPLEX_UNITY;

     w.x = p(1,1).x - beta; // work around for LLVM
     w.y = p(1,1).y;
     Float norm1_inv = 1.0/cabs(w);
     w = conj(w)*norm1_inv;
     z = p(2,1)*norm1_inv;
     vec[2] = z*w;

     tau.x  = (beta - p(1,1).x)/beta;
     tau.y  = p(1,1).y/beta;
     // I could very easily change the definition of tau
     // so that we wouldn't need to call conj(temp) below.
     // I would have to be careful to make sure this change
     // is consistent with the other parts of the code.
     constructHHMat(tau, vec, temp);
     p = conj(temp)*p;
     u = u*temp;
   }

   // Step 4: build the second right reflector
   // (a pure phase on the last column that makes p(1,2) real)
   setIdentity(&temp);
   if( p(1,2).y != 0.0 ){
     beta = p(1,2).x > 0.0 ? -cabs(p(1,2)) : cabs(p(1,2));
     temp(2,2) = conj(p(1,2))/beta;
     p(2,2) = p(2,2)*temp(2,2); // This is the only element of p needed below
     v = v*temp;
   }

   // Step 5: build the third left reflector
   // (a pure phase on the last row that makes p(2,2) real; temp is still the
   //  identity apart from its (2,2) element, which is overwritten here)
   if( p(2,2).y != 0.0 ){
     beta = p(2,2).x > 0.0 ? -cabs(p(2,2)) : cabs(p(2,2));
     temp(2,2) = p(2,2)/beta;
     u = u*temp;
   }

   return;
 }


 // Iteratively diagonalises the real 3x3 matrix b in place.
 //
 //   u, v   : outputs; reset to the identity and then updated with every
 //            rotation applied from the left (u) or from the right (v)
 //   b      : in/out; on exit the diagonal holds non-negative values.
 //            presumably upper bidiagonal on entry (b(1,0) and b(2,1) are
 //            copied into the 2x2 sub-problems but never used by smallSVD)
 //            -- TODO confirm against callers
 //   max_it : upper bound on the number of passes through the loop
 //
 // Each pass first zeroes super-diagonal entries that are small relative to
 // SVDPREC, then either
 //   - handles a zero diagonal entry with dedicated rotations,
 //   - performs one shifted QR step (four rotations chasing the bulge), or
 //   - hands a decoupled 2x2 block to smallSVD.
 // The loop ends once both b(0,1) and b(1,2) are exactly zero, or after
 // max_it passes.
 template<class Real>
   DEVICEHOST
 void bdSVD(Matrix<Real,3>& u, Matrix<Real,3>& v, Matrix<Real,3>& b, int max_it)
 {

   Real c,s;

   // set u and v matrices equal to the identity
   setIdentity(&u);
   setIdentity(&v);

   Real alpha, beta;

   int it=0;
   do{

     // Deflation: treat negligible super-diagonal entries as exact zeros.
     // NOTE(review): the second test scales by b(0,0) and b(2,2), whereas the
     // first uses the two diagonal entries adjacent to b(0,1); confirm whether
     // b(1,1) was intended instead of b(0,0).
     if( fabs(b(0,1)) < SVDPREC*( fabs(b(0,0)) + fabs(b(1,1)) ) ){ b(0,1) = 0.0; }
     if( fabs(b(1,2)) < SVDPREC*( fabs(b(0,0)) + fabs(b(2,2)) ) ){ b(1,2) = 0.0; }

     if( b(0,1) != 0.0 && b(1,2) != 0.0 ){
       if( b(0,0) == 0.0 ){

         // Zero leading diagonal entry: clear the first row with two left
         // rotations.  Note that s and c are passed in swapped order here.
         getGivensRotation(-b(0,1), b(1,1), s, c);

         // rotate columns 0 and 1 of u
         for(int i=0; i<3; ++i){
           alpha = u(i,0);
           beta = u(i,1);
           u(i,0) = alpha*c - beta*s;
           u(i,1) = alpha*s + beta*c;
         }

         b(1,1) = b(0,1)*s + b(1,1)*c;
         b(0,1) = 0.0;

         // the first rotation creates a fill-in at b(0,2)
         b(0,2) = -b(1,2)*s;
         b(1,2) *= c;

         // second rotation removes b(0,2)
         getGivensRotation(-b(0,2), b(2,2), s, c);

         // rotate columns 0 and 2 of u
         for(int i=0; i<3; ++i){
           alpha = u(i,0);
           beta = u(i,2);
           u(i,0) = alpha*c - beta*s;
           u(i,2) = alpha*s + beta*c;
         }
         b(2,2) = b(0,2)*s + b(2,2)*c;
         b(0,2) = 0.0;

       }else if( b(1,1) == 0.0 ){
         // Zero middle diagonal entry: one left rotation removes b(1,2)
         // (same pattern as the second rotation of the previous branch).
         getGivensRotation(-b(1,2), b(2,2), s, c);
         // rotate columns 1 and 2 of u
         for(int i=0; i<3; ++i){
           alpha = u(i,1);
           beta = u(i,2);
           u(i,1) = alpha*c - beta*s;
           u(i,2) = alpha*s + beta*c;
         }
         b(2,2) = b(1,2)*s + b(2,2)*c;
         b(1,2) = 0.0;
         // end of the shared pattern
       }else if( b(2,2) == 0.0 ){

         // Zero trailing diagonal entry: clear the last column with two
         // right rotations.
         getGivensRotation(b(1,1), -b(1,2), c, s);
         // rotate columns 1 and 2 of v
         for(int i=0; i<3; ++i){
           alpha = v(i,1);
           beta = v(i,2);
           v(i,1) = alpha*c + beta*s;
           v(i,2) = -alpha*s + beta*c;
         }
         b(1,1) = b(1,1)*c + b(1,2)*s;
         b(1,2) = 0.0;

         // the first rotation creates a fill-in at b(0,2)
         b(0,2) = -b(0,1)*s;
         b(0,1) *= c;

         // apply second rotation, to remove b02
         getGivensRotation(b(0,0), -b(0,2), c, s);
         // rotate columns 0 and 2 of v
         for(int i=0; i<3; ++i){
           alpha = v(i,0);
           beta = v(i,2);
           v(i,0) = alpha*c + beta*s;
           v(i,2) = -alpha*s + beta*c;
         }
         b(0,0) = b(0,0)*c + b(0,2)*s;
         b(0,2) = 0.0;

       }else{ // Else entering normal QR iteration

         // shift for this step
         Real lambda_max;
         getLambdaMax(b, lambda_max); // defined above

         alpha = b(0,0)*b(0,0) - lambda_max;
         beta  = b(0,0)*b(0,1);

         // c*beta + s*alpha = 0
         getGivensRotation(alpha, beta, c, s);
         // Multiply right v matrix
         accumGivensRotation(0, c, s, v);
         // apply to bidiagonal matrix, this generates b(1,0)
         alpha = b(0,0);
         beta  = b(0,1);

         b(0,0) = alpha*c - beta*s;
         b(0,1) = alpha*s + beta*c;
         b(1,0) = -b(1,1)*s;
         b(1,1) = b(1,1)*c;

         // Calculate the second Givens rotation (this time on the left)
         getGivensRotation(b(0,0), b(1,0), c, s);

         // Multiply left u matrix
         accumGivensRotation(0, c, s, u);

         // Eliminating b(1,0) generates b(0,2)
         b(0,0) = b(0,0)*c - b(1,0)*s;
         alpha  = b(0,1);
         beta   = b(1,1);
         b(0,1) = alpha*c - beta*s;
         b(1,1) = alpha*s + beta*c;
         b(0,2) = -b(1,2)*s;
         b(1,2) = b(1,2)*c;
         // Following from the definition of the Givens rotation, b(1,0) should be equal to zero.
         b(1,0) = 0.0;

         // Calculate the third Givens rotation (on the right)
         getGivensRotation(b(0,1), b(0,2), c, s);

         // Multiply the right v matrix
         accumGivensRotation(1, c, s, v);

         // Eliminating b(0,2) generates b(2,1)
         b(0,1) = b(0,1)*c - b(0,2)*s;
         alpha = b(1,1);
         beta  = b(1,2);

         b(1,1) = alpha*c - beta*s;
         b(1,2) = alpha*s + beta*c;
         b(2,1) = -b(2,2)*s;
         b(2,2) *= c;
         b(0,2) = 0.0;


         // Calculate the fourth Givens rotation (on the left)
         getGivensRotation(b(1,1), b(2,1), c, s);
         // Multiply left u matrix
         accumGivensRotation(1, c, s, u);
         // Eliminate b(2,1)
         b(1,1) = b(1,1)*c - b(2,1)*s;
         alpha = b(1,2);
         beta  = b(2,2);
         b(1,2) = alpha*c - beta*s;
         b(2,2) = alpha*s + beta*c;
         b(2,1) = 0.0;

       } // end of normal QR iteration


     }else if( b(0,1) == 0.0 ){
       // b(0,0) has decoupled: solve the trailing 2x2 block directly.
       Matrix<Real,2> m_small, u_small, v_small;

       m_small(0,0) = b(1,1);
       m_small(0,1) = b(1,2);
       m_small(1,0) = b(2,1);
       m_small(1,1) = b(2,2);

       smallSVD(u_small, v_small, m_small);

       b(1,1) = m_small(0,0);
       b(1,2) = m_small(0,1);
       b(2,1) = m_small(1,0);
       b(2,2) = m_small(1,1);


       // fold the 2x2 factors into columns 1 and 2 of u and v
       for(int i=0; i<3; ++i){
         alpha = u(i,1);
         beta  = u(i,2);
         u(i,1) = alpha*u_small(0,0) + beta*u_small(1,0);
         u(i,2) = alpha*u_small(0,1) + beta*u_small(1,1);

         alpha = v(i,1);
         beta  = v(i,2);
         v(i,1) = alpha*v_small(0,0) + beta*v_small(1,0);
         v(i,2) = alpha*v_small(0,1) + beta*v_small(1,1);
       }


     }else if( b(1,2) == 0.0 ){
       // b(2,2) has decoupled: solve the leading 2x2 block directly.
       Matrix<Real,2> m_small, u_small, v_small;

       m_small(0,0) = b(0,0);
       m_small(0,1) = b(0,1);
       m_small(1,0) = b(1,0);
       m_small(1,1) = b(1,1);

       smallSVD(u_small, v_small, m_small);

       b(0,0) = m_small(0,0);
       b(0,1) = m_small(0,1);
       b(1,0) = m_small(1,0);
       b(1,1) = m_small(1,1);

       // fold the 2x2 factors into columns 0 and 1 of u and v
       for(int i=0; i<3; ++i){
         alpha = u(i,0);
         beta  = u(i,1);
         u(i,0) = alpha*u_small(0,0) + beta*u_small(1,0);
         u(i,1) = alpha*u_small(0,1) + beta*u_small(1,1);

         alpha = v(i,0);
         beta  = v(i,1);
         v(i,0) = alpha*v_small(0,0) + beta*v_small(1,0);
         v(i,1) = alpha*v_small(0,1) + beta*v_small(1,1);
       }

     } // end if b(1,2) == 0
     it++;
   } while( (b(0,1) != 0.0 || b(1,2) != 0.0) && it < max_it);

   // Make the diagonal non-negative; the sign is absorbed into the
   // corresponding column of v.
   for(int i=0; i<3; ++i){
     if( b(i,i) < 0.0) {
       b(i,i) *= -1;
       for(int j=0; j<3; ++j){
         v(j,i) *= -1;
       }
     }
   }
   return;
 }


 // Singular value decomposition driver for a 3x3 complex matrix.
 //
 //   m               : input matrix (not modified)
 //   u, v            : outputs; the complex factors from getRealBidiagMatrix
 //                     multiplied by the real factors from bdSVD
 //   singular_values : output; receives the diagonal of the matrix
 //                     diagonalised by bdSVD
 //
 // Steps: (1) getRealBidiagMatrix computes u and v, (2) the real part of
 // conj(u)*m*v is handed to bdSVD with at most 500 iterations, (3) the
 // real rotations returned by bdSVD are folded into u and v.
 template<class Float>
   DEVICEHOST
 void computeSVD(const Matrix<complex<Float>,3> & m, Matrix<complex<Float>,3>&  u,
     Matrix<complex<Float>,3>& v,  Float singular_values[3])
 {
   getRealBidiagMatrix<Float>(m, u, v);

   // Form the transformed matrix once instead of once per element.
   Matrix<complex<Float>,3> bidiag = conj(u)*m*v;

   Matrix<Float,3> bd, u_real, v_real;
   // Make real
   for(int i=0; i<3; ++i){
     for(int j=0; j<3; ++j){
       bd(i,j) = bidiag(i,j).real();
     }
   }

   bdSVD(u_real, v_real, bd, 500);
   for(int i=0; i<3; ++i){
     singular_values[i] = bd(i,i);
   }

   u = u*u_real;
   v = v*v_real;

   return;
 }

 //} // end namespace quda

 #undef INVALID_DOUBLE

 #endif // _SVD_QUDA_H_
exp
int exp
Definition: CMakeCUDACompilerId.cpp1.ii:8074

log
double log(double)

conj
Matrix< N, std::complex< T > > conj(const Matrix< N, std::complex< T > > &mat)
Definition: hisq_force_reference2.cpp:231

INVALID_DOUBLE
#define INVALID_DOUBLE
Definition: svd_quda.h:9

quda::Complex
std::complex< double > Complex
Definition: eig_variables.h:13

getGivensRotation
DEVICEHOST void getGivensRotation(const Real &alpha, const Real &beta, Real &c, Real &s)
Definition: svd_quda.h:96

getLambdaMax
DEVICEHOST void getLambdaMax(const Matrix< Real, 3 > &b, Real &lambda_max)
Definition: svd_quda.h:77

z
int int z
Definition: CMakeCUDACompilerId.cpp1.ii:2637

getNorm
DEVICEHOST float getNorm(const Array< complex< float >, 3 > &a)
Definition: svd_quda.h:38

index
char * index(const char *, int)

b
#define b
Definition: dw_dslash4_core.h:83

x
p x
Definition: CMakeCUDACompilerId.cpp1.ii:3011

quda::outerProd
__device__ __host__ void outerProd(const Array< T, N > &a, const Array< T, N > &b, Matrix< T, N > *m)
Definition: quda_matrix.h:695

computeSVD
DEVICEHOST void computeSVD(const Matrix< complex< Float >, 3 > &m, Matrix< complex< Float >, 3 > &u, Matrix< complex< Float >, 3 > &v, Float singular_values[3])
Definition: svd_quda.h:620

smallSVD
DEVICEHOST void smallSVD(Matrix< Real, 2 > &u, Matrix< Real, 2 > &v, Matrix< Real, 2 > &m)
Definition: svd_quda.h:148

cabs
DEVICEHOST std::remove_reference< decltype(Cmplx::x)>::type cabs(const Cmplx &z)
Definition: svd_quda.h:17

DEVICEHOST
#define DEVICEHOST
Definition: svd_quda.h:6

w
int int int w
Definition: CMakeCUDACompilerId.cpp1.ii:2637

p
static __inline__ size_t p
Definition: CMakeCUDACompilerId.cpp1.ii:2995

fused_exterior_ndeg_tm_dslash_cuda_gen.i
int i
start here
Definition: fused_exterior_ndeg_tm_dslash_cuda_gen.py:816

sqrt
double sqrt(double)

quda::copyColumn
__device__ __host__ void copyColumn(const Matrix< T, N > &m, int c, Array< T, N > *a)
Definition: quda_matrix.h:683

norm2
double norm2(Float *v, int len)
Definition: blas_reference.cpp:41

dslash::it
int it
Definition: dslash_quda.cu:64

quda::setIdentity
__device__ __host__ void setIdentity(Matrix< T, N > *m)
Definition: quda_matrix.h:543

getRealBidiagMatrix
DEVICEHOST void getRealBidiagMatrix(const Matrix< complex< Float >, 3 > &mat, Matrix< complex< Float >, 3 > &u, Matrix< complex< Float >, 3 > &v)
Definition: svd_quda.h:260

quadSum
DEVICEHOST PromoteTypeId< T, U >::Type quadSum(const T &a, const U &b)
Definition: svd_quda.h:28

SVDPREC
#define SVDPREC
Definition: svd_quda.h:7

Matrix
Definition: hisq_force_reference2.cpp:131

quda::blas::norm1
double norm1(const ColorSpinorField &b)
Definition: reduce_quda.cu:200

swap
DEVICEHOST void swap(Real &a, Real &b)
Definition: svd_quda.h:139

assignGivensRotation
DEVICEHOST void assignGivensRotation(const Real &c, const Real &s, Matrix< Real, 2 > &m)
Definition: svd_quda.h:129

s
size_t s
Definition: CMakeCUDACompilerId.cpp1.ii:2229

constructHHMat
DEVICEHOST void constructHHMat(const T &tau, const Array< T, 3 > &v, Matrix< T, 3 > &hh)
Definition: svd_quda.h:61

fabs
double fabs(double)

deg_tm_dslash_cuda_gen.sign
def sign(x)
Definition: deg_tm_dslash_cuda_gen.py:104

c
const void * c
Definition: CMakeCUDACompilerId.cpp1.ii:2234

LOG2
#define LOG2
Definition: svd_quda.h:8

bdSVD
DEVICEHOST void bdSVD(Matrix< Real, 3 > &u, Matrix< Real, 3 > &v, Matrix< Real, 3 > &b, int max_it)
Definition: svd_quda.h:392

mat
void mat(void *out, void **link, void *in, int dagger_bit, int mu, QudaPrecision sPrecision, QudaPrecision gPrecision)
Definition: covdev_reference.cpp:117

a
#define a
Definition: dw_dslash4_core.h:82

accumGivensRotation
DEVICEHOST void accumGivensRotation(int index, const Real &c, const Real &s, Matrix< Real, 3 > &m)
Definition: svd_quda.h:115

y
int y
Definition: CMakeCUDACompilerId.cpp1.ii:2637