quda-ref/v1.1.0/quda__arpack__interface_8cpp_source.html

 #include <stdio.h>

 #include <stdlib.h>

 #include <math.h>

 #include <iostream>

 #include <vector>

 #include <algorithm>


 #include <quda_internal.h>

 #include <quda_arpack_interface.h>

 #include <eigensolve_quda.h>

 #include <color_spinor_field.h>

 #include <blas_quda.h>

 #include <util_quda.h>


 // ARPACK INTERFACE ROUTINES

 //--------------------------------------------------------------------------


 #if (defined(QMP_COMMS) || defined(MPI_COMMS))

 #include <mpi.h>

 #include "mpi_comm_handle.h"

 #endif


 namespace quda

 {


 #ifdef ARPACK_LIB


   // Forward declarations of the two help printers defined further down in this file.
   // arpack_solve calls them right before raising an error on a non-zero ARPACK INFO code.
   void arpackErrorHelpNAUPD();

   void arpackErrorHelpNEUPD();


   // Compute eigenpairs of the operator `mat` with the complex non-symmetric (P)ARPACK
   // reverse-communication drivers (p)znaupd / (p)zneupd.
   //
   // h_evecs   : host fields receiving the eigenvectors. h_evecs[0] also serves as the template
   //             for the geometry of every temporary field, so the vector must not be empty.
   // h_evals   : receives the eigenvalues, recomputed as v^dag * M * v, in the same order as h_evecs.
   // mat       : operator applied through EigenSolver::chebyOp during the Arnoldi iteration and
   //             through EigenSolver::matVec when the eigenvalues are recomputed.
   // eig_param : supplies n_ev, n_kr, tol, max_restarts, spectrum, use_poly_acc and, when
   //             ARPACK_LOGGING is defined, arpack_logfile.
   // profile   : timer updated around the individual phases of the solve.
   //
   // At most min(nconv, container size) entries of h_evals / h_evecs are written, where nconv is
   // the number of converged Ritz values reported by ARPACK in IPARAM(5).
   void arpack_solve(std::vector<ColorSpinorField *> &h_evecs, std::vector<Complex> &h_evals, const DiracMatrix &mat,
                     QudaEigParam *eig_param, TimeProfile &profile)
   {
     // h_evecs[0] is dereferenced below to size and describe every work field
     if (h_evecs.empty()) errorQuda("arpack_solve requires at least one host vector in h_evecs");

     // Create Eigensolver object for member function use
     EigenSolver *eig_solver = EigenSolver::create(eig_param, mat, profile);

     profile.TPSTART(QUDA_PROFILE_INIT);

 // ARPACK logfile name
 #ifdef ARPACK_LOGGING
     char *arpack_logfile = eig_param->arpack_logfile;
 #endif
     if (getVerbosity() >= QUDA_SUMMARIZE) {
       printfQuda("**** START ARPACK SOLUTION ****\n");
 #ifndef ARPACK_LOGGING
       printfQuda("Arpack logging not enabled.\n");
 #else
       printfQuda("Output directed to %s\n", arpack_logfile);
 #endif
     }

     // Construct parameters and memory allocation
     //---------------------------------------------------------------------------------

     // MPI objects: the parallel ARPACK routines take the Fortran handle of the communicator
 #if (defined(QMP_COMMS) || defined(MPI_COMMS))
     MPI_Fint mpi_comm_fort = MPI_Comm_c2f(MPI_COMM_HANDLE);
     int *fcomm_ = static_cast<int *>(&mpi_comm_fort);
 #endif

     // every variable handed to the FORTRAN routines carries a trailing underscore
     int ido_ = 0;
     int info_ = 1; // if 0, use random vector. If 1, initial residual lives in resid_
     int *ipntr_ = (int *)safe_malloc(14 * sizeof(int));
     int *iparam_ = (int *)safe_malloc(11 * sizeof(int));
     // Only a few entries are assigned below; zero the rest so that no uninitialised
     // memory is passed to (or later read back from) the FORTRAN routines.
     std::fill(ipntr_, ipntr_ + 14, 0);
     std::fill(iparam_, iparam_ + 11, 0);

     int n_ = h_evecs[0]->Volume() * h_evecs[0]->Nspin() * h_evecs[0]->Ncolor();
     int n_ev_ = eig_param->n_ev;
     int n_kr_ = eig_param->n_kr;
     int ldv_ = h_evecs[0]->Volume() * h_evecs[0]->Nspin() * h_evecs[0]->Ncolor();
     int lworkl_ = (3 * n_kr_ * n_kr_ + 5 * n_kr_) * 2;
     int rvec_ = 1;
     int max_iter = eig_param->max_restarts * (n_kr_ - n_ev_) + n_ev_;

     // Buffer sizes are computed in size_t: n_kr_ * ldv_ does not fit in an int for large
     // lattices / Krylov spaces.
     const size_t n_ev_sz = static_cast<size_t>(n_ev_);
     const size_t n_kr_sz = static_cast<size_t>(n_kr_);
     const size_t ldv_sz = static_cast<size_t>(ldv_);
     const size_t lworkl_sz = static_cast<size_t>(lworkl_);

     // Assign values to ARPACK params
     iparam_[0] = 1;
     iparam_[2] = max_iter;
     iparam_[3] = 1;
     iparam_[6] = 1;

     // ARPACK problem type to be solved
     char howmny = 'P';
     char bmat = 'I';
     char spectrum[3];

     // Part of the spectrum to be computed.
     switch (eig_param->spectrum) {
     case QUDA_SPECTRUM_SR_EIG: strcpy(spectrum, "SR"); break;
     case QUDA_SPECTRUM_LR_EIG: strcpy(spectrum, "LR"); break;
     case QUDA_SPECTRUM_SM_EIG: strcpy(spectrum, "SM"); break;
     case QUDA_SPECTRUM_LM_EIG: strcpy(spectrum, "LM"); break;
     case QUDA_SPECTRUM_SI_EIG: strcpy(spectrum, "SI"); break;
     case QUDA_SPECTRUM_LI_EIG: strcpy(spectrum, "LI"); break;
     default: errorQuda("Unexpected spectrum type %d", eig_param->spectrum);
     }

     bool reverse = false;
     if (strncmp("S", spectrum, 1) == 0 && eig_param->use_poly_acc) {
       // The user asked for the smallest eigenvalues, but with polynomial acceleration
       // the largest ones are requested from ARPACK; the final ordering is reversed below.
       reverse = true;
       spectrum[0] = 'L';
     }

     double tol_ = eig_param->tol;

     // ARPACK workspace
     Complex imag_unit(0.0, 1.0);
     Complex *resid_ = (Complex *)safe_malloc(ldv_sz * sizeof(Complex));

     // Use initial guess? (info_ is set to 1 above, so resid_ is always filled here)
     if (info_ > 0) {
       for (size_t a = 0; a < ldv_sz; a++) resid_[a] = imag_unit;
     }

     Complex sigma_ = 0.0;
     Complex *w_workd_ = (Complex *)safe_malloc(3 * ldv_sz * sizeof(Complex));
     Complex *w_workl_ = (Complex *)safe_malloc(lworkl_sz * sizeof(Complex));
     Complex *w_workev_ = (Complex *)safe_malloc(2 * n_kr_sz * sizeof(Complex));
     double *w_rwork_ = (double *)safe_malloc(n_kr_sz * sizeof(double));
     int *select_ = (int *)safe_malloc(n_kr_sz * sizeof(int));

     Complex *h_evecs_ = (Complex *)safe_malloc(n_kr_sz * ldv_sz * sizeof(Complex));
     // The eigenvalue array D of zneupd is documented with dimension NEV+1, so one extra
     // entry is allocated to keep the FORTRAN routine inside the buffer.
     Complex *h_evals_ = (Complex *)safe_malloc((n_ev_sz + 1) * sizeof(Complex));
     std::vector<ColorSpinorField *> h_evecs_arpack;
     h_evecs_arpack.reserve(n_kr_sz);

     for (size_t i = 0; i < n_kr_sz; i++) {
       // create container wrapping the vectors returned from ARPACK
       ColorSpinorParam param(*h_evecs[0]);
       param.fieldOrder = QUDA_SPACE_SPIN_COLOR_FIELD_ORDER;
       param.location = QUDA_CPU_FIELD_LOCATION;
       param.create = QUDA_REFERENCE_FIELD_CREATE;
       param.gammaBasis = QUDA_UKQCD_GAMMA_BASIS;
       param.v = h_evecs_ + i * ldv_sz;
       h_evecs_arpack.push_back(ColorSpinorField::Create(param));
     }

     int iter_count = 0;

     bool allocate = true;
     ColorSpinorField *h_v = nullptr;
     ColorSpinorField *d_v = nullptr;
     ColorSpinorField *h_v2 = nullptr;
     ColorSpinorField *d_v2 = nullptr;

 #ifdef ARPACK_LOGGING
     // ARPACK log routines
     // Code added to print the log of ARPACK
     int arpack_log_u = 9999;

 #if (defined(QMP_COMMS) || defined(MPI_COMMS))
     if (arpack_logfile != NULL && (comm_rank() == 0)) {
       ARPACK(initlog)(&arpack_log_u, arpack_logfile, strlen(arpack_logfile));
       // NOTE(review): both levels are 9 although the message below reports 3 - confirm intent
       int msglvl0 = 9, msglvl3 = 9;
       ARPACK(pmcinitdebug)
       (&arpack_log_u, // logfil
        &msglvl3,      // mcaupd
        &msglvl3,      // mcaup2
        &msglvl0,      // mcaitr
        &msglvl3,      // mceigh
        &msglvl0,      // mcapps
        &msglvl0,      // mcgets
        &msglvl3       // mceupd
       );
       if (getVerbosity() >= QUDA_SUMMARIZE) {
         printfQuda("eigenSolver: Log info:\n");
         printfQuda("ARPACK verbosity set to mcaup2=3 mcaupd=3 mceupd=3; \n");
         printfQuda("output is directed to %s\n", arpack_logfile);
       }
     }
 #else
     if (arpack_logfile != NULL) {
       ARPACK(initlog)(&arpack_log_u, arpack_logfile, strlen(arpack_logfile));
       // NOTE(review): both levels are 9 although the message below reports 3 - confirm intent
       int msglvl0 = 9, msglvl3 = 9;
       ARPACK(mcinitdebug)
       (&arpack_log_u, // logfil
        &msglvl3,      // mcaupd
        &msglvl3,      // mcaup2
        &msglvl0,      // mcaitr
        &msglvl3,      // mceigh
        &msglvl0,      // mcapps
        &msglvl0,      // mcgets
        &msglvl3       // mceupd
       );
       if (getVerbosity() >= QUDA_SUMMARIZE) {
         printfQuda("eigenSolver: Log info:\n");
         printfQuda("ARPACK verbosity set to mcaup2=3 mcaupd=3 mceupd=3; \n");
         printfQuda("output is directed to %s\n", arpack_logfile);
       }
     }

 #endif
 #endif

     profile.TPSTOP(QUDA_PROFILE_INIT);

     // Start ARPACK routines
     //---------------------------------------------------------------------------------

     do {

       profile.TPSTART(QUDA_PROFILE_ARPACK);

       // Interface to arpack routines
       //----------------------------
 #if (defined(QMP_COMMS) || defined(MPI_COMMS))
       ARPACK(pznaupd)
       (fcomm_, &ido_, &bmat, &n_, spectrum, &n_ev_, &tol_, resid_, &n_kr_, h_evecs_, &n_, iparam_, ipntr_, w_workd_,
        w_workl_, &lworkl_, w_rwork_, &info_, 1, 2);

       if (info_ != 0) {
         arpackErrorHelpNAUPD();
         errorQuda("\nError in pznaupd info = %d. Exiting.", info_);
       }
 #else
       ARPACK(znaupd)
       (&ido_, &bmat, &n_, spectrum, &n_ev_, &tol_, resid_, &n_kr_, h_evecs_, &n_, iparam_, ipntr_, w_workd_, w_workl_,
        &lworkl_, w_rwork_, &info_, 1, 2);
       if (info_ != 0) {
         arpackErrorHelpNAUPD();
         errorQuda("\nError in znaupd info = %d. Exiting.", info_);
       }
 #endif

       profile.TPSTOP(QUDA_PROFILE_ARPACK);

       // If this is the first iteration, we allocate CPU and GPU memory for QUDA
       if (allocate) {
         ColorSpinorParam param(*h_evecs[0]);
         param.fieldOrder = QUDA_SPACE_SPIN_COLOR_FIELD_ORDER;
         param.location = QUDA_CPU_FIELD_LOCATION;
         param.create = QUDA_REFERENCE_FIELD_CREATE;
         param.gammaBasis = QUDA_UKQCD_GAMMA_BASIS;

         // Fortran arrays start at 1. The C++ pointer is therefore the Fortran pointer
         // less one, hence ipntr[0] - 1 to specify the correct address.
         param.v = w_workd_ + (ipntr_[0] - 1);
         h_v = ColorSpinorField::Create(param);
         // Adjust the position of the start of the array.
         param.v = w_workd_ + (ipntr_[1] - 1);
         h_v2 = ColorSpinorField::Create(param);

         // create device field temporaries
         param.location = QUDA_CUDA_FIELD_LOCATION;
         param.create = QUDA_ZERO_FIELD_CREATE;
         param.setPrecision(param.Precision(), param.Precision(), true);

         d_v = ColorSpinorField::Create(param);
         d_v2 = ColorSpinorField::Create(param);
         allocate = false;
       }

       if (ido_ == 99 || info_ == 1) break;

       if (ido_ == -1 || ido_ == 1) {

         // host work vector -> device
         profile.TPSTART(QUDA_PROFILE_H2D);
         *d_v = *h_v;
         profile.TPSTOP(QUDA_PROFILE_H2D);

         profile.TPSTART(QUDA_PROFILE_COMPUTE);
         // apply matrix-vector operation here:
         eig_solver->chebyOp(mat, *d_v2, *d_v);
         profile.TPSTOP(QUDA_PROFILE_COMPUTE);

         // device result -> host work vector
         profile.TPSTART(QUDA_PROFILE_D2H);
         *h_v2 = *d_v2;
         profile.TPSTOP(QUDA_PROFILE_D2H);
       }

       if (getVerbosity() >= QUDA_VERBOSE)
         printfQuda("Arpack Iteration %s: %d\n", eig_param->use_poly_acc ? "(with poly acc) " : "", iter_count);
       iter_count++;

     } while (99 != ido_ && iter_count < max_iter);

     // Reverse communication finished. Compute n_ev eigenvectors and values

     if (getVerbosity() >= QUDA_SUMMARIZE) {
       printfQuda("Finish: iter=%04d  info=%d  ido=%d\n", iter_count, info_, ido_);
       printfQuda("Computing eigenvectors\n");
     }

     profile.TPSTART(QUDA_PROFILE_ARPACK);

     // Interface to arpack routines
     //----------------------------
 #if (defined(QMP_COMMS) || defined(MPI_COMMS))
     ARPACK(pzneupd)
     (fcomm_, &rvec_, &howmny, select_, h_evals_, h_evecs_, &n_, &sigma_, w_workev_, &bmat, &n_, spectrum, &n_ev_, &tol_,
      resid_, &n_kr_, h_evecs_, &n_, iparam_, ipntr_, w_workd_, w_workl_, &lworkl_, w_rwork_, &info_, 1, 1, 2);
     if (info_ == -15) {
       arpackErrorHelpNEUPD();
       errorQuda("\nError in pzneupd info = %d. You likely need to\n"
                 "increase the maximum ARPACK iterations. Exiting.",
                 info_);
     } else if (info_ != 0) {
       arpackErrorHelpNEUPD();
       errorQuda("\nError in pzneupd info = %d. Exiting.", info_);
     }
 #else
     ARPACK(zneupd)
     (&rvec_, &howmny, select_, h_evals_, h_evecs_, &n_, &sigma_, w_workev_, &bmat, &n_, spectrum, &n_ev_, &tol_, resid_,
      &n_kr_, h_evecs_, &n_, iparam_, ipntr_, w_workd_, w_workl_, &lworkl_, w_rwork_, &info_, 1, 1, 2);
     if (info_ == -15) {
       arpackErrorHelpNEUPD();
       errorQuda("\nError in zneupd info = %d. You likely need to\n"
                 "increase the maximum ARPACK iterations. Exiting.",
                 info_);
     } else if (info_ != 0) {
       arpackErrorHelpNEUPD();
       errorQuda("\nError in zneupd info = %d. Exiting.", info_);
     }
 #endif

     profile.TPSTOP(QUDA_PROFILE_ARPACK);

     // Print additional convergence information.
     // NOTE(review): every non-zero info_ has already been passed to errorQuda above, so these
     // branches look unreachable if errorQuda terminates the run - confirm before removing.
     if (info_ == 1) {
       if (getVerbosity() >= QUDA_SUMMARIZE) printfQuda("Maximum number of iterations reached.\n");
     } else if (info_ == 3) {
       // single call so that the complete message is emitted
       errorQuda("ARPACK Error: No shifts could be applied during implicit\n"
                 "Arnoldi update.\n");
     }
 #ifdef ARPACK_LOGGING
 #if (defined(QMP_COMMS) || defined(MPI_COMMS))
     if (comm_rank() == 0) {
       if (arpack_logfile != NULL) { ARPACK(finilog)(&arpack_log_u); }
     }
 #else
     if (arpack_logfile != NULL) ARPACK(finilog)(&arpack_log_u);
 #endif
 #endif

     if (getVerbosity() >= QUDA_SUMMARIZE) printfQuda("Checking eigenvalues\n");

     // IPARAM(5): number of converged Ritz values; never treat a negative value as a count
     const int nconv = std::max(iparam_[4], 0);

     // Order the converged eigenvalues by ascending real part, keeping track of the
     // position each one has in the ARPACK output arrays.
     std::vector<std::pair<double, int>> evals_sorted;
     evals_sorted.reserve(nconv);
     for (int j = 0; j < nconv; j++) { evals_sorted.push_back(std::make_pair(h_evals_[j].real(), j)); }

     // Sort the array by value (first in the pair)
     // and the index (second in the pair) will come along
     // for the ride.
     std::sort(evals_sorted.begin(), evals_sorted.end());
     if (reverse) std::reverse(evals_sorted.begin(), evals_sorted.end());

     // print out the computed Ritz values and their error estimates
     for (int j = 0; j < nconv; j++) {
       if (getVerbosity() >= QUDA_SUMMARIZE)
         printfQuda("RitzValue[%04d] = %+.16e %+.16e Residual: %+.16e\n", j, real(h_evals_[evals_sorted[j].second]),
                    imag(h_evals_[evals_sorted[j].second]),
                    std::abs(*(w_workl_ + ipntr_[10] - 1 + evals_sorted[j].second)));
     }

     // Recompute the eigenvalues from the eigenvectors and measure the true residuals.
     for (int i = 0; i < nconv; i++) {
       int idx = evals_sorted[i].second;

       // host eigenvector -> device
       profile.TPSTART(QUDA_PROFILE_H2D);
       *d_v = *h_evecs_arpack[idx];
       profile.TPSTOP(QUDA_PROFILE_H2D);

       profile.TPSTART(QUDA_PROFILE_COMPUTE);
       // d_v2 = M*v
       eig_solver->matVec(mat, *d_v2, *d_v);

       // lambda = v^dag * M*v
       h_evals_[idx] = blas::cDotProduct(*d_v, *d_v2);

       Complex unit(1.0, 0.0);
       Complex m_lambda(-h_evals_[idx]);

       // d_v = M*v - lambda*v, whose norm is reported below
       blas::caxpby(unit, *d_v2, m_lambda, *d_v);
       double L2norm = blas::norm2(*d_v);

       profile.TPSTOP(QUDA_PROFILE_COMPUTE);

       if (getVerbosity() >= QUDA_SUMMARIZE)
         printfQuda("EigValue[%04d] = %+.16e  %+.16e  Residual: %.16e\n", i, real(h_evals_[idx]), imag(h_evals_[idx]),
                    sqrt(L2norm));
     }

     // Copy back using the sorting index. The counts are clamped to the size of the
     // caller's containers so that no element past their end is written.
     const size_t n_evals_out = std::min(static_cast<size_t>(nconv), h_evals.size());
     for (size_t i = 0; i < n_evals_out; i++) h_evals[i] = h_evals_[evals_sorted[i].second];

     const size_t n_evecs_out = std::min(static_cast<size_t>(nconv), h_evecs.size());
     for (size_t i = 0; i < n_evecs_out; i++) *h_evecs[i] = *h_evecs_arpack[evals_sorted[i].second];

     profile.TPSTART(QUDA_PROFILE_FREE);

     // cleanup: destroy the field objects before releasing the host buffers they wrap
     for (size_t i = 0; i < h_evecs_arpack.size(); i++) delete h_evecs_arpack[i];
     delete h_v;
     delete h_v2;
     delete d_v;
     delete d_v2;
     delete eig_solver;

     host_free(h_evals_);
     host_free(h_evecs_);
     host_free(ipntr_);
     host_free(iparam_);
     host_free(resid_);
     host_free(w_workd_);
     host_free(w_workl_);
     host_free(w_workev_);
     host_free(w_rwork_);
     host_free(select_);

     profile.TPSTOP(QUDA_PROFILE_FREE);
   }


   // Print the explanation of every INFO code of the ARPACK *naupd routines.
   // The text is kept in a table and emitted one line per printfQuda call.
   void arpackErrorHelpNAUPD()
   {
     static const char *const naupd_help[] = {
       "Error help NAUPD\n",
       "INFO Integer.  (INPUT/OUTPUT)\n",
       "     If INFO .EQ. 0, a randomly initial residual vector is used.\n",
       "     If INFO .NE. 0, RESID contains the initial residual vector,\n",
       "                        possibly from a previous run.\n",
       "     Error flag on output.\n",
       "     =  0: Normal exit.\n",
       "     =  1: Maximum number of iterations taken.\n",
       "        All possible eigenvalues of OP has been found. IPARAM(5)\n",
       "        returns the number of wanted converged Ritz values.\n",
       "     =  2: No longer an informational error. Deprecated starting\n",
       "        with release 2 of ARPACK.\n",
       "     =  3: No shifts could be applied during a cycle of the\n",
       "        Implicitly restarted Arnoldi iteration. One possibility\n",
       "        is to increase the size of NCV relative to NEV.\n",
       "        See remark 4 below.\n",
       "     = -1: N must be positive.\n",
       "     = -2: NEV must be positive.\n",
       "     = -3: NCV-NEV >= 1 and less than or equal to N.\n",
       "     = -4: The maximum number of Arnoldi update iteration\n",
       "        must be greater than zero.\n",
       "     = -5: WHICH must be 'LM', 'SM', 'LR', 'SR', 'LI', 'SI'\n",
       "     = -6: BMAT must be one of 'I' or 'G'.\n",
       "     = -7: Length of private work array is not sufficient.\n",
       "     = -8: Error return from LAPACK eigenvalue calculation;\n",
       "     = -9: Starting vector is zero.\n",
       "     = -10: IPARAM(7) must be 1,2,3.\n",
       "     = -11: IPARAM(7) = 1 and BMAT = 'G' are incompatible.\n",
       "     = -12: IPARAM(1) must be equal to 0 or 1.\n",
       "     = -9999: Could not build an Arnoldi factorization.\n",
       "        User input error highly likely.  Please\n",
       "        check actual array dimensions and layout.\n",
       "        IPARAM(5) returns the size of the current Arnoldi\n",
       "        factorization.\n",
     };

     // none of the lines contains a conversion specifier, so "%s" reproduces them verbatim
     for (const char *text : naupd_help) printfQuda("%s", text);
   }


   // Print the explanation of every INFO code of the ARPACK *neupd routines.
   // The text is kept in a table and emitted one line per printfQuda call.
   void arpackErrorHelpNEUPD()
   {
     static const char *const neupd_help[] = {
       "Error help NEUPD\n",
       "INFO Integer.  (OUTPUT)\n",
       "     Error flag on output.\n",
       "     =  0: Normal exit.\n",
       "     =  1: The Schur form computed by LAPACK routine csheqr\n",
       "        could not be reordered by LAPACK routine ztrsen.\n",
       "        Re-enter subroutine zneupd with IPARAM(5)=NCV and\n",
       "        increase the size of the array D to have\n",
       "        dimension at least dimension NCV and allocate at\n",
       "        least NCV\n",
       "        columns for Z. NOTE: Not necessary if Z and V share\n",
       "        the same space. Please notify the authors if this\n",
       "        error occurs.\n",
       "     = -1: N must be positive.\n",
       "     = -2: NEV must be positive.\n",
       "     = -3: NCV-NEV >= 1 and less than or equal to N.\n",
       "     = -5: WHICH must be 'LM', 'SM', 'LR', 'SR', 'LI', 'SI'\n",
       "     = -6: BMAT must be one of 'I' or 'G'.\n",
       "     = -7: Length of private work WORKL array is inufficient.\n",
       "     = -8: Error return from LAPACK eigenvalue calculation.\n",
       "        This should never happened.\n",
       "     = -9: Error return from calculation of eigenvectors.\n",
       "        Informational error from LAPACK routine ztrevc.\n",
       "     = -10: IPARAM(7) must be 1,2,3\n",
       "     = -11: IPARAM(7) = 1 and BMAT = 'G' are incompatible.\n",
       "     = -12: HOWMNY = 'S' not yet implemented\n",
       "     = -13: HOWMNY must be one of 'A' or 'P' if RVEC = .true.\n",
       "     = -14: ZNAUPD did not find any eigenvalues to sufficient\n",
       "        accuracy.\n",
       "     = -15: ZNEUPD got a different count of the number of\n",
       "        converged Ritz values than ZNAUPD got. This\n",
       "        indicates the user probably made an error in\n",
       "        passing data from ZNAUPD to ZNEUPD or that the\n",
       "        data was modified before entering ZNEUPD\n",
     };

     // none of the lines contains a conversion specifier, so "%s" reproduces them verbatim
     for (const char *text : neupd_help) printfQuda("%s", text);
   }


 #else


   // Stand-in compiled when ARPACK_LIB is not defined: it has the same signature as the
   // ARPACK-backed version and only reports that (P)ARPACK is unavailable.
   void arpack_solve(std::vector<ColorSpinorField *> &h_evecs,
                     std::vector<Complex> &h_evals,
                     const DiracMatrix &mat,
                     QudaEigParam *eig_param,
                     TimeProfile &profile)
   {
     errorQuda("(P)ARPACK has not been enabled for this build");
   }

 #endif


 } // namespace quda

blas_quda.h

quda::ColorSpinorField::Create
static ColorSpinorField * Create(const ColorSpinorParam &param)
Definition: color_spinor_field.cpp:714

quda::DiracMatrix
Definition: dirac_quda.h:1892

quda::EigenSolver::create
static EigenSolver * create(QudaEigParam *eig_param, const DiracMatrix &mat, TimeProfile &profile)
Creates the eigensolver using the parameters given and the matrix.
Definition: eigensolve_quda.cpp:97

quda::TimeProfile
Definition: timer.h:174

color_spinor_field.h

comm_rank
int comm_rank(void)
Definition: communicator_stack.cpp:87

mat
void mat(void *out, void **link, void *in, int dagger_bit, int mu, QudaPrecision sPrecision, QudaPrecision gPrecision)
Definition: covdev_reference.cpp:109

eigensolve_quda.h

QUDA_CUDA_FIELD_LOCATION
@ QUDA_CUDA_FIELD_LOCATION
Definition: enum_quda.h:326

QUDA_CPU_FIELD_LOCATION
@ QUDA_CPU_FIELD_LOCATION
Definition: enum_quda.h:325

QUDA_SUMMARIZE
@ QUDA_SUMMARIZE
Definition: enum_quda.h:266

QUDA_VERBOSE
@ QUDA_VERBOSE
Definition: enum_quda.h:267

QUDA_UKQCD_GAMMA_BASIS
@ QUDA_UKQCD_GAMMA_BASIS
Definition: enum_quda.h:369

QUDA_SPECTRUM_LM_EIG
@ QUDA_SPECTRUM_LM_EIG
Definition: enum_quda.h:147

QUDA_SPECTRUM_SM_EIG
@ QUDA_SPECTRUM_SM_EIG
Definition: enum_quda.h:148

QUDA_SPECTRUM_LR_EIG
@ QUDA_SPECTRUM_LR_EIG
Definition: enum_quda.h:149

QUDA_SPECTRUM_SR_EIG
@ QUDA_SPECTRUM_SR_EIG
Definition: enum_quda.h:150

QUDA_SPECTRUM_SI_EIG
@ QUDA_SPECTRUM_SI_EIG
Definition: enum_quda.h:152

QUDA_SPECTRUM_LI_EIG
@ QUDA_SPECTRUM_LI_EIG
Definition: enum_quda.h:151

QUDA_SPACE_SPIN_COLOR_FIELD_ORDER
@ QUDA_SPACE_SPIN_COLOR_FIELD_ORDER
Definition: enum_quda.h:351

QUDA_ZERO_FIELD_CREATE
@ QUDA_ZERO_FIELD_CREATE
Definition: enum_quda.h:361

QUDA_REFERENCE_FIELD_CREATE
@ QUDA_REFERENCE_FIELD_CREATE
Definition: enum_quda.h:363

safe_malloc
#define safe_malloc(size)
Definition: malloc_quda.h:106

host_free
#define host_free(ptr)
Definition: malloc_quda.h:115

mpi_comm_handle.h

quda::blas::caxpby
void caxpby(const Complex &a, ColorSpinorField &x, const Complex &b, ColorSpinorField &y)

quda::blas::norm2
double norm2(const ColorSpinorField &a)

quda::blas::cDotProduct
Complex cDotProduct(ColorSpinorField &, ColorSpinorField &)

quda
Definition: blas_lapack.h:24

quda::arpack_solve
void arpack_solve(std::vector< ColorSpinorField * > &h_evecs, std::vector< Complex > &h_evals, const DiracMatrix &mat, QudaEigParam *eig_param, TimeProfile &profile)
The QUDA interface function. One passes two allocated arrays to hold the the eigenmode data,...
Definition: quda_arpack_interface.cpp:507

quda::Complex
std::complex< double > Complex
Definition: quda_internal.h:86

quda::sqrt
__host__ __device__ ValueType sqrt(ValueType x)
Definition: complex_quda.h:120

quda::QUDA_PROFILE_INIT
@ QUDA_PROFILE_INIT
Definition: timer.h:106

quda::QUDA_PROFILE_COMPUTE
@ QUDA_PROFILE_COMPUTE
Definition: timer.h:108

quda::QUDA_PROFILE_ARPACK
@ QUDA_PROFILE_ARPACK
Definition: timer.h:118

quda::QUDA_PROFILE_FREE
@ QUDA_PROFILE_FREE
Definition: timer.h:111

quda::QUDA_PROFILE_H2D
@ QUDA_PROFILE_H2D
Definition: timer.h:104

quda::QUDA_PROFILE_D2H
@ QUDA_PROFILE_D2H
Definition: timer.h:105

quda::abs
__host__ __device__ ValueType abs(ValueType x)
Definition: complex_quda.h:125

param
QudaGaugeParam param
Definition: pack_test.cpp:18

quda_arpack_interface.h

quda_internal.h

QudaEigParam_s
Definition: quda.h:406

QudaEigParam_s::spectrum
QudaEigSpectrumType spectrum
Definition: quda.h:466

QudaEigParam_s::use_poly_acc
QudaBoolean use_poly_acc
Definition: quda.h:419

QudaEigParam_s::tol
double tol
Definition: quda.h:479

QudaEigParam_s::arpack_logfile
char arpack_logfile[512]
Definition: quda.h:494

QudaEigParam_s::n_ev
int n_ev
Definition: quda.h:469

QudaEigParam_s::max_restarts
int max_restarts
Definition: quda.h:485

QudaEigParam_s::n_kr
int n_kr
Definition: quda.h:471

QudaGaugeParam_s::location
QudaFieldLocation location
Definition: quda.h:33

util_quda.h

printfQuda
#define printfQuda(...)
Definition: util_quda.h:114

getVerbosity
QudaVerbosity getVerbosity()
Definition: util_quda.cpp:21

errorQuda
#define errorQuda(...)
Definition: util_quda.h:120