quda-ref/v1.1.0/clover__field_8cpp_source.html

 #include <stdlib.h>

 #include <stdio.h>

 #include <string.h>

 #include <math.h>

 #include <typeinfo>


 #include <quda_internal.h>

 #include <clover_field.h>

 #include <gauge_field.h>

 #include <color_spinor_field.h>

 #include <blas_quda.h>


 namespace quda {


   /**
      Build a parameter struct that describes an existing clover field.

      The direct / inverse members are initialised from a.V(false) and
      a.V(true); the coefficient, ordering and location metadata are read
      from the field's accessors.  The four data pointers are left null
      and the create type is QUDA_NULL_FIELD_CREATE.

      @param a Clover field whose metadata is copied
   */
   CloverFieldParam::CloverFieldParam(const CloverField &a) :
     LatticeFieldParam(a),
     direct(a.V(false)),
     inverse(a.V(true)),
     clover(nullptr),
     norm(nullptr),
     cloverInv(nullptr),
     invNorm(nullptr),
     csw(a.Csw()),
     coeff(a.Coeff()),
     twisted(a.Twisted()),
     mu2(a.Mu2()),
     rho(a.Rho()),
     order(a.Order()),
     create(QUDA_NULL_FIELD_CREATE),
     location(a.Location())
   {
     // overwrite the lattice-level settings with what the field reports
     siteSubset = QUDA_FULL_SITE_SUBSET;
     pad = a.Pad();
     precision = a.Precision();
     nDim = a.Ndim();

     // copy the lattice extents one dimension at a time
     const int *extent = a.X();
     for (int d = 0; d < nDim; d++) x[d] = extent[d];
   }


   /**
      Base-class constructor.  Records the clover metadata held in param
      and works out the element counts and byte sizes of a clover array
      and (for half / quarter precision) of its norm array.  No memory is
      allocated here; the data pointers start out null.

      @param param Parameter struct describing the field to create
   */
   CloverField::CloverField(const CloverFieldParam &param) :
     LatticeField(param),
     bytes(0),
     norm_bytes(0),
     nColor(3),
     nSpin(4),
     clover(0),
     norm(0),
     cloverInv(0),
     invNorm(0),
     csw(param.csw),
     coeff(param.coeff),
     rho(param.rho),
     order(param.order),
     create(param.create),
     trlog {0, 0}
   {
     if (nDim != 4) errorQuda("Number of dimensions must be 4, not %d", nDim);

     if (create != QUDA_REFERENCE_FIELD_CREATE && order == QUDA_QDPJIT_CLOVER_ORDER)
       errorQuda("QDPJIT ordered clover fields only supported for reference fields");

     // nColor^2 * nSpin^2 = 144; the trailing /2 below leaves 72 reals per site
     // (block-diagonal Hermitian storage) for each of the two parities
     const size_t site_factor = ((size_t)nColor) * nColor * nSpin * nSpin;
     real_length = 2 * ((size_t)volumeCB) * site_factor / 2;
     length = 2 * ((size_t)stride) * site_factor / 2;

     bytes = length * precision;
     if (isNative()) bytes = 2 * ALIGNMENT_ADJUST(bytes / 2);

     const bool fixed_point = (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION);
     if (fixed_point) {
       // one float per chirality (2) for both parities (2 * stride sites)
       norm_bytes = sizeof(float) * 2 * stride * 2;
       if (isNative()) norm_bytes = 2 * ALIGNMENT_ADJUST(norm_bytes / 2);
     }

     // twisted-mass settings are deliberately not read from param here
     twisted = false;
     mu2 = 0.0;
   }


   // The base class releases nothing itself; the derived destructors free the arrays.
   CloverField::~CloverField() = default;


   /**
      Factory: instantiate the clover field implementation that matches
      param.location.

      @param param Parameter struct describing the field to create
      @return Newly allocated cpuCloverField or cudaCloverField; an
      unrecognised location is reported through errorQuda
   */
   CloverField *CloverField::Create(const CloverFieldParam &param)
   {
     switch (param.location) {
     case QUDA_CPU_FIELD_LOCATION: return new cpuCloverField(param);
     case QUDA_CUDA_FIELD_LOCATION: return new cudaCloverField(param);
     default: errorQuda("Invalid field location %d", param.location);
     }

     return nullptr;
   }


   void CloverField::setRho(double rho_)

   {

     rho = rho_;

   }


   /**
      Construct a device clover field.

      For each of the direct (param.direct) and inverse (param.inverse)
      arrays that is requested, the array and its norm array are either
      allocated from the device pool or, for reference fields, adopted
      from the pointers held in param.  The even / odd parity pointers
      are then set to the first and second half of each array.  If only
      one of the two arrays is requested, the pointers of the missing
      one are aliased to the one that exists.

      @param param Parameter struct describing the field to create
   */
   cudaCloverField::cudaCloverField(const CloverFieldParam &param) : CloverField(param) {


     // only null-create (allocate here) and reference (adopt external pointers) are accepted
     if (create != QUDA_NULL_FIELD_CREATE && create != QUDA_REFERENCE_FIELD_CREATE)

       errorQuda("Create type %d not supported", create);


     if (param.direct) {

       if (create != QUDA_REFERENCE_FIELD_CREATE) {

         // skip the allocation entirely when the size is zero
         clover = bytes ? pool_device_malloc(bytes) : nullptr;

         // the norm array is only allocated for half / quarter precision
         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           norm = norm_bytes ? pool_device_malloc(norm_bytes) : nullptr;

       } else {

         clover = param.clover;

         norm = param.norm;

       }


       // even parity is the first half of the array, odd parity the second half
       even = clover;

       odd = static_cast<char*>(clover) + bytes/2;


       evenNorm = norm;

       oddNorm = static_cast<char*>(norm) + norm_bytes/2;


       total_bytes += bytes + norm_bytes;


       // this is a hack to prevent us allocating a texture object for an unallocated inverse field

       if (!param.inverse) {

         cloverInv = clover;

         evenInv = even;

         oddInv = odd;

         invNorm = norm;

         evenInvNorm = evenNorm;

         oddInvNorm = oddNorm;

       }

     }


     if (param.inverse) {

       if (create != QUDA_REFERENCE_FIELD_CREATE) {

         cloverInv = bytes ? pool_device_malloc(bytes) : nullptr;

         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           invNorm = norm_bytes ? pool_device_malloc(norm_bytes) : nullptr;

       } else {

         cloverInv = param.cloverInv;

         invNorm = param.invNorm;

       }


       // same even / odd split as for the direct array
       evenInv = cloverInv;

       oddInv = static_cast<char*>(cloverInv) + bytes/2;


       evenInvNorm = invNorm;

       oddInvNorm = static_cast<char*>(invNorm) + norm_bytes/2;


       total_bytes += bytes + norm_bytes;


       // this is a hack to ensure that we can autotune the clover

       // operator when just using symmetric preconditioning

       if (!param.direct) {

         clover = cloverInv;

         even = evenInv;

         odd = oddInv;

         norm = invNorm;

         evenNorm = evenInvNorm;

         oddNorm = oddInvNorm;

       }

     }


     // No inverse requested: point the inverse members at the direct ones.
     // This repeats the aliasing already done inside the param.direct branch
     // above, and is also executed when param.direct is false.
     if (!param.inverse) {

       cloverInv = clover;

       evenInv = even;

       oddInv = odd;

       invNorm = norm;

       evenInvNorm = evenNorm;

       oddInvNorm = oddNorm;

     }


     // the base-class constructor leaves these at false / 0.0; take the real values from param
     twisted = param.twisted;

     mu2 = param.mu2;

   }


   /**
      Return the device allocations to the pool.  Reference fields are
      left alone, and an allocation shared by the direct and inverse
      pointers is released exactly once (through the inverse pointers).
   */
   cudaCloverField::~cudaCloverField()
   {
     if (create == QUDA_REFERENCE_FIELD_CREATE) return;

     // the direct pointers are only freed when they do not alias the inverse ones
     const bool direct_is_separate = (clover != cloverInv);
     if (direct_is_separate) {
       if (clover) pool_device_free(clover);
       if (norm) pool_device_free(norm);
     }

     if (cloverInv) pool_device_free(cloverInv);
     if (invNorm) pool_device_free(invNorm);
   }


   void cudaCloverField::copy(const CloverField &src, bool inverse) {


     checkField(src);


     if (typeid(src) == typeid(cudaCloverField)) {

       if (src.V(false)) copyGenericClover(*this, src, false, QUDA_CUDA_FIELD_LOCATION);

       if (src.V(true)) copyGenericClover(*this, src, true, QUDA_CUDA_FIELD_LOCATION);

     } else if (reorder_location() == QUDA_CPU_FIELD_LOCATION && typeid(src) == typeid(cpuCloverField)) {

       void *packClover = pool_pinned_malloc(bytes + norm_bytes);

       void *packCloverNorm = (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION) ?

           static_cast<char *>(packClover) + bytes :

           0;


       if (src.V(false)) {

         copyGenericClover(*this, src, false, QUDA_CPU_FIELD_LOCATION, packClover, 0, packCloverNorm, 0);

         qudaMemcpy(clover, packClover, bytes, cudaMemcpyHostToDevice);

         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           qudaMemcpy(norm, packCloverNorm, norm_bytes, cudaMemcpyHostToDevice);

       }


       if (src.V(true) && inverse) {

         copyGenericClover(*this, src, true, QUDA_CPU_FIELD_LOCATION, packClover, 0, packCloverNorm, 0);

         qudaMemcpy(cloverInv, packClover, bytes, cudaMemcpyHostToDevice);

         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           qudaMemcpy(invNorm, packCloverNorm, norm_bytes, cudaMemcpyHostToDevice);

       }


       pool_pinned_free(packClover);

     } else if (reorder_location() == QUDA_CUDA_FIELD_LOCATION && typeid(src) == typeid(cpuCloverField)) {

       void *packClover = pool_device_malloc(src.Bytes() + src.NormBytes());

       void *packCloverNorm = (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION) ?

           static_cast<char *>(packClover) + src.Bytes() :

           0;


       if (src.V(false)) {

         qudaMemcpy(packClover, src.V(false), src.Bytes(), cudaMemcpyHostToDevice);

         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           qudaMemcpy(packCloverNorm, src.Norm(false), src.NormBytes(), cudaMemcpyHostToDevice);


         copyGenericClover(*this, src, false, QUDA_CUDA_FIELD_LOCATION, 0, packClover, 0, packCloverNorm);

       }


       if (src.V(true) && inverse) {

         qudaMemcpy(packClover, src.V(true), src.Bytes(), cudaMemcpyHostToDevice);

         if (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION)

           qudaMemcpy(packCloverNorm, src.Norm(true), src.NormBytes(), cudaMemcpyHostToDevice);


         copyGenericClover(*this, src, true, QUDA_CUDA_FIELD_LOCATION, 0, packClover, 0, packCloverNorm);

       }


       pool_device_free(packClover);

     } else {

       errorQuda("Invalid clover field type");

     }


     qudaDeviceSynchronize();

   }


   void cudaCloverField::loadCPUField(const cpuCloverField &cpu) { copy(cpu); }


   /**
      Save this device field into a host clover field.

      Each array present on both sides is downloaded into a pinned host
      buffer and then reordered into cpu by copyGenericClover.  An array
      that exists on only one side is reported through errorQuda.

      The norm array is transferred for both half and quarter precision:
      the constructor gives both a non-zero norm_bytes, and copy() treats
      them the same way.  (Previously only half precision was handled, so
      a quarter-precision field was saved without its norm.)

      @param cpu Host field that receives the data
   */
   void cudaCloverField::saveCPUField(cpuCloverField &cpu) const
   {
     checkField(cpu);

     // fixed-point precisions keep a separate norm array that must travel with the data
     const bool fixed_point = (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION);

     // we know we are copying from GPU to CPU here, so for now just
     // assume that reordering is on CPU
     void *packClover = pool_pinned_malloc(bytes + norm_bytes);
     void *packCloverNorm = fixed_point ? static_cast<char *>(packClover) + bytes : 0;

     // first copy over the direct part (if it exists)
     if (V(false) && cpu.V(false)) {
       qudaMemcpy(packClover, clover, bytes, cudaMemcpyDeviceToHost);
       if (fixed_point) qudaMemcpy(packCloverNorm, norm, norm_bytes, cudaMemcpyDeviceToHost);
       copyGenericClover(cpu, *this, false, QUDA_CPU_FIELD_LOCATION, 0, packClover, 0, packCloverNorm);
     } else if ((V(false) && !cpu.V(false)) || (!V(false) && cpu.V(false))) {
       errorQuda("Mismatch between Clover field GPU V(false) and CPU.V(false)");
     }

     // now copy the inverse part (if it exists)
     if (V(true) && cpu.V(true)) {
       qudaMemcpy(packClover, cloverInv, bytes, cudaMemcpyDeviceToHost);
       if (fixed_point) qudaMemcpy(packCloverNorm, invNorm, norm_bytes, cudaMemcpyDeviceToHost);
       copyGenericClover(cpu, *this, true, QUDA_CPU_FIELD_LOCATION, 0, packClover, 0, packCloverNorm);
     } else if ((V(true) && !cpu.V(true)) || (!V(true) && cpu.V(true))) {
       errorQuda("Mismatch between Clover field GPU V(true) and CPU.V(true)");
     }

     pool_pinned_free(packClover);

     qudaDeviceSynchronize();
   }


   /**
      Copy the field contents from the device into a host buffer.

      Layout written: [direct clover | direct norm] followed by
      [inverse clover | inverse norm].  A section is only written when
      the corresponding array exists, and the norm parts only when the
      precision is below single.

      @param buffer Host destination buffer
   */
   void cudaCloverField::copy_to_buffer(void *buffer) const
   {
     char *const host = static_cast<char *>(buffer);
     const bool has_norm = (precision < QUDA_SINGLE_PRECISION);

     // where the inverse section starts; stays 0 if there is no direct section
     size_t inverse_start = 0;

     if (V(false)) { // direct
       qudaMemcpy(host, clover, bytes, cudaMemcpyDeviceToHost);
       if (has_norm) qudaMemcpy(host + bytes, norm, norm_bytes, cudaMemcpyDeviceToHost);
       inverse_start = bytes + norm_bytes;
     }

     if (V(true)) { // inverse
       char *const inverse_dst = host + inverse_start;
       qudaMemcpy(inverse_dst, cloverInv, bytes, cudaMemcpyDeviceToHost);
       if (has_norm) qudaMemcpy(inverse_dst + bytes, invNorm, norm_bytes, cudaMemcpyDeviceToHost);
     }
   }


   /**
      Fill the device field from a host buffer.

      Layout read: [direct clover | direct norm] followed by
      [inverse clover | inverse norm].  A section is only read when the
      corresponding array exists, and the norm parts only when the
      precision is below single.

      @param buffer Host source buffer
   */
   void cudaCloverField::copy_from_buffer(void *buffer)
   {
     char *const host = static_cast<char *>(buffer);
     const bool has_norm = (precision < QUDA_SINGLE_PRECISION);

     // where the inverse section starts; stays 0 if there is no direct section
     size_t inverse_start = 0;

     if (V(false)) { // direct
       qudaMemcpy(clover, host, bytes, cudaMemcpyHostToDevice);
       if (has_norm) qudaMemcpy(norm, host + bytes, norm_bytes, cudaMemcpyHostToDevice);
       inverse_start = bytes + norm_bytes;
     }

     if (V(true)) { // inverse
       char *const inverse_src = host + inverse_start;
       qudaMemcpy(cloverInv, inverse_src, bytes, cudaMemcpyHostToDevice);
       if (has_norm) qudaMemcpy(invNorm, inverse_src + bytes, norm_bytes, cudaMemcpyHostToDevice);
     }
   }


   /**
      Prefetch both the direct and the inverse clover data by forwarding
      to the typed overload with BOTH_CLOVER_PREFETCH_TYPE.

      @param mem_space Memory space to prefetch to
      @param stream Stream the prefetch is issued on
   */
   void cudaCloverField::prefetch(QudaFieldLocation mem_space, qudaStream_t stream) const
   {
     const CloverPrefetchType everything = CloverPrefetchType::BOTH_CLOVER_PREFETCH_TYPE;
     prefetch(mem_space, stream, everything);
   }


   /**
      Prefetch selected parts of the clover field; a no-op unless
      is_prefetch_enabled() returns true.

      @param mem_space Memory space to prefetch to
      @param stream Stream the prefetch is issued on
      @param type Which arrays to prefetch: direct only, inverse only, or
      both (the inverse is skipped in the "both" case when it aliases the
      direct array)
      @param parity QUDA_INVALID_PARITY selects the full arrays; otherwise
      only the even or odd half is prefetched
   */
   void cudaCloverField::prefetch(QudaFieldLocation mem_space, qudaStream_t stream, CloverPrefetchType type,
                                  QudaParity parity) const
   {
     if (!is_prefetch_enabled()) return;

     // default: the complete arrays covering both parities
     auto direct_ptr = clover;
     auto direct_norm_ptr = norm;
     auto inverse_ptr = cloverInv;
     auto inverse_norm_ptr = invNorm;
     auto data_bytes = bytes;
     auto scale_bytes = norm_bytes;

     if (parity != QUDA_INVALID_PARITY) {
       // single parity: half the size, starting at the even or odd sub-array
       const bool is_even = (parity == QUDA_EVEN_PARITY);
       direct_ptr = is_even ? even : odd;
       direct_norm_ptr = is_even ? evenNorm : oddNorm;
       inverse_ptr = is_even ? evenInv : oddInv;
       inverse_norm_ptr = is_even ? evenInvNorm : oddInvNorm;
       data_bytes /= 2;
       scale_bytes /= 2;
     }

     const bool want_both = (type == CloverPrefetchType::BOTH_CLOVER_PREFETCH_TYPE);
     const bool want_direct_only = (type == CloverPrefetchType::CLOVER_CLOVER_PREFETCH_TYPE);
     const bool want_inverse_only = (type == CloverPrefetchType::INVERSE_CLOVER_PREFETCH_TYPE);

     if (!(want_both || want_direct_only || want_inverse_only)) errorQuda("Invalid CloverPrefetchType.");

     if (want_both || want_direct_only) {
       if (direct_ptr) qudaMemPrefetchAsync(direct_ptr, data_bytes, mem_space, stream);
       if (direct_norm_ptr) qudaMemPrefetchAsync(direct_norm_ptr, scale_bytes, mem_space, stream);
     }

     // in the "both" case the inverse is only prefetched when it is a distinct array
     if (want_inverse_only || (want_both && direct_ptr != inverse_ptr)) {
       if (inverse_ptr) qudaMemPrefetchAsync(inverse_ptr, data_bytes, mem_space, stream);
       if (inverse_norm_ptr) qudaMemPrefetchAsync(inverse_norm_ptr, scale_bytes, mem_space, stream);
     }
   }


   /**
      Fill this field by calling computeClover with a coefficient of 1.0.
      @param gauge Gauge field handed to computeClover
   */
   void cudaCloverField::compute(const cudaGaugeField &gauge)
   {
     const double unit_coeff = 1.0;
     computeClover(*this, gauge, unit_coeff);
   }


   /**
      Construct a host clover field.

      - QUDA_NULL_FIELD_CREATE / QUDA_ZERO_FIELD_CREATE: the direct array
        is always allocated, the inverse array only if param.inverse is
        set; zero-create additionally clears everything that was
        allocated.  Only QUDA_PACKED_CLOVER_ORDER is accepted here.
      - QUDA_REFERENCE_FIELD_CREATE: the pointers held in param are
        adopted without allocating.
      - Any other create type is reported through errorQuda.

      The norm arrays are allocated for both half and quarter precision.
      The base-class constructor sets a non-zero norm_bytes for both, and
      copy_to_buffer / copy_from_buffer access the norm arrays for every
      precision below single, so leaving them null for quarter precision
      (as was done before) would lead to a null-pointer memcpy.

      @param param Parameter struct describing the field; pad must be zero
   */
   cpuCloverField::cpuCloverField(const CloverFieldParam &param) : CloverField(param)
   {
     // fixed-point precisions need a separate norm array
     const bool fixed_point = (precision == QUDA_HALF_PRECISION || precision == QUDA_QUARTER_PRECISION);

     if (create == QUDA_NULL_FIELD_CREATE || create == QUDA_ZERO_FIELD_CREATE) {
       if (order != QUDA_PACKED_CLOVER_ORDER) { errorQuda("cpuCloverField only supports QUDA_PACKED_CLOVER_ORDER"); }

       clover = (void *)safe_malloc(bytes);
       if (fixed_point) norm = (void *)safe_malloc(norm_bytes);

       if (param.inverse) {
         cloverInv = (void *)safe_malloc(bytes);
         if (fixed_point) invNorm = (void *)safe_malloc(norm_bytes);
       }

       if (create == QUDA_ZERO_FIELD_CREATE) {
         memset(clover, '\0', bytes);
         if (param.inverse) memset(cloverInv, '\0', bytes);
         if (fixed_point) memset(norm, '\0', norm_bytes);
         if (param.inverse && fixed_point) memset(invNorm, '\0', norm_bytes);
       }
     } else if (create == QUDA_REFERENCE_FIELD_CREATE) {
       clover = param.clover;
       norm = param.norm;
       cloverInv = param.cloverInv;
       invNorm = param.invNorm;
     } else {
       errorQuda("Create type %d not supported", create);
     }

     if (param.pad != 0) errorQuda("%s pad must be zero", __func__);
   }


   /**
      Free the host arrays owned by this field.  Reference fields do not
      own their memory, so nothing is released for them.
   */
   cpuCloverField::~cpuCloverField()
   {
     if (create == QUDA_REFERENCE_FIELD_CREATE) return;

     // direct array and its norm
     if (clover) host_free(clover);
     if (norm) host_free(norm);

     // inverse array and its norm
     if (cloverInv) host_free(cloverInv);
     if (invNorm) host_free(invNorm);
   }


   /**
      Copy the field contents into a host buffer.

      Layout written: [direct clover | direct norm] followed by
      [inverse clover | inverse norm].  A section is only written when
      the corresponding array exists, and the norm parts only when the
      precision is below single.

      @param buffer Host destination buffer
   */
   void cpuCloverField::copy_to_buffer(void *buffer) const
   {
     char *const out = static_cast<char *>(buffer);
     const bool has_norm = (precision < QUDA_SINGLE_PRECISION);

     // where the inverse section starts; stays 0 if there is no direct section
     size_t inverse_start = 0;

     if (V(false)) { // direct
       std::memcpy(out, clover, bytes);
       if (has_norm) std::memcpy(out + bytes, norm, norm_bytes);
       inverse_start = bytes + norm_bytes;
     }

     if (V(true)) { // inverse
       char *const inverse_out = out + inverse_start;
       std::memcpy(inverse_out, cloverInv, bytes);
       if (has_norm) std::memcpy(inverse_out + bytes, invNorm, norm_bytes);
     }
   }


   /**
      Fill the field from a host buffer.

      Layout read: [direct clover | direct norm] followed by
      [inverse clover | inverse norm].  A section is only read when the
      corresponding array exists, and the norm parts only when the
      precision is below single.

      @param buffer Host source buffer
   */
   void cpuCloverField::copy_from_buffer(void *buffer)
   {
     char *const in = static_cast<char *>(buffer);
     const bool has_norm = (precision < QUDA_SINGLE_PRECISION);

     // where the inverse section starts; stays 0 if there is no direct section
     size_t inverse_start = 0;

     if (V(false)) { // direct
       std::memcpy(clover, in, bytes);
       if (has_norm) std::memcpy(norm, in + bytes, norm_bytes);
       inverse_start = bytes + norm_bytes;
     }

     if (V(true)) { // inverse
       char *const inverse_in = in + inverse_start;
       std::memcpy(cloverInv, inverse_in, bytes);
       if (has_norm) std::memcpy(invNorm, inverse_in + bytes, norm_bytes);
     }
   }


   // This doesn't really live here, but is fine for the moment

   std::ostream& operator<<(std::ostream& output, const CloverFieldParam& param)

   {

     output << static_cast<const LatticeFieldParam&>(param);

     output << "direct = "    << param.direct << std::endl;

     output << "inverse = "   << param.inverse << std::endl;

     output << "clover = "    << param.clover << std::endl;

     output << "norm = "      << param.norm << std::endl;

     output << "cloverInv = " << param.cloverInv << std::endl;

     output << "invNorm = "   << param.invNorm << std::endl;

     output << "csw = "       << param.csw << std::endl;

     output << "coeff = "     << param.coeff << std::endl;

     output << "twisted = "   << param.twisted << std::endl;

     output << "mu2 = "       << param.mu2 << std::endl;

     output << "rho = "       << param.rho << std::endl;

     output << "order = "     << param.order << std::endl;

     output << "create = "    << param.create << std::endl;

     return output;  // for multiple << operators.

   }


   /**
      Build a ColorSpinorParam that references the memory of a clover
      field, so that the clover array can be handed to routines that
      operate on ColorSpinorFields (see norm1 / norm2 below).

      The reinterpretation is refused for half and quarter precision:
      both store a separate norm array (see the norm_bytes set-up in the
      CloverField constructor), which a reference to the clover array
      alone does not carry.  Previously only half precision was rejected.

      @param a Clover field to reference
      @param inverse Whether to reference the inverse (true) or the
      direct (false) array
      @return Parameter struct with create = QUDA_REFERENCE_FIELD_CREATE
      and v pointing at a.V(inverse)
   */
   ColorSpinorParam colorSpinorParam(const CloverField &a, bool inverse)
   {
     if (a.Precision() == QUDA_HALF_PRECISION || a.Precision() == QUDA_QUARTER_PRECISION)
       errorQuda("Casting a CloverField into ColorSpinorField not possible in half or quarter precision");

     ColorSpinorParam spinor_param;
     // 72 = 9 * 4 * 2
     spinor_param.nColor = 9;
     spinor_param.nSpin = 4;
     spinor_param.nDim = a.Ndim();
     for (int d = 0; d < a.Ndim(); d++) spinor_param.x[d] = a.X()[d];
     spinor_param.setPrecision(a.Precision());
     spinor_param.pad = a.Pad();
     spinor_param.siteSubset = QUDA_FULL_SITE_SUBSET;
     spinor_param.siteOrder = QUDA_EVEN_ODD_SITE_ORDER;
     // set after setPrecision() so that this explicit choice is the one that sticks
     spinor_param.fieldOrder = a.Precision() == QUDA_DOUBLE_PRECISION ? QUDA_FLOAT2_FIELD_ORDER : QUDA_FLOAT4_FIELD_ORDER;
     spinor_param.gammaBasis = QUDA_UKQCD_GAMMA_BASIS;
     // reference the clover memory rather than allocating a new field
     spinor_param.create = QUDA_REFERENCE_FIELD_CREATE;
     spinor_param.v = (void *)a.V(inverse);
     spinor_param.location = a.Location();
     return spinor_param;
   }


   // Return the L2 norm squared of the clover field

   double norm2(const CloverField &a, bool inverse) {

     ColorSpinorField *b = ColorSpinorField::Create(colorSpinorParam(a, inverse));

     double nrm2 = blas::norm2(*b);

     delete b;

     return nrm2;

   }


   // Return the L1 norm of the clover field

   double norm1(const CloverField &a, bool inverse) {

     ColorSpinorField *b = ColorSpinorField::Create(colorSpinorParam(a, inverse));

     double nrm1 = blas::norm1(*b);

     delete b;

     return nrm1;

   }


 } // namespace quda

blas_quda.h

quda::CloverField
Definition: clover_field.h:106

quda::CloverField::Norm
void * Norm(bool inverse=false)
Definition: clover_field.h:139

quda::CloverField::bytes
size_t bytes
Definition: clover_field.h:109

quda::CloverField::order
QudaCloverFieldOrder order
Definition: clover_field.h:127

quda::CloverField::twisted
bool twisted
Definition: clover_field.h:123

quda::CloverField::real_length
size_t real_length
Definition: clover_field.h:112

quda::CloverField::nSpin
int nSpin
Definition: clover_field.h:114

quda::CloverField::norm_bytes
size_t norm_bytes
Definition: clover_field.h:110

quda::CloverField::invNorm
void * invNorm
Definition: clover_field.h:119

quda::CloverField::nColor
int nColor
Definition: clover_field.h:113

quda::CloverField::Create
static CloverField * Create(const CloverFieldParam &param)
Definition: clover_field.cpp:65

quda::CloverField::NormBytes
size_t NormBytes() const
Definition: clover_field.h:172

quda::CloverField::setRho
void setRho(double rho)
Bakes in the rho factor into the clover field, (for real diagonal additive Hasenbusch),...
Definition: clover_field.cpp:80

quda::CloverField::clover
void * clover
Definition: clover_field.h:116

quda::CloverField::V
void * V(bool inverse=false)
Definition: clover_field.h:138

quda::CloverField::isNative
bool isNative() const
Definition: clover_field.h:152

quda::CloverField::cloverInv
void * cloverInv
Definition: clover_field.h:118

quda::CloverField::create
QudaFieldCreate create
Definition: clover_field.h:128

quda::CloverField::rho
double rho
Definition: clover_field.h:125

quda::CloverField::CloverField
CloverField(const CloverFieldParam &param)
Definition: clover_field.cpp:39

quda::CloverField::~CloverField
virtual ~CloverField()
Definition: clover_field.cpp:63

quda::CloverField::mu2
double mu2
Definition: clover_field.h:124

quda::CloverField::norm
void * norm
Definition: clover_field.h:117

quda::CloverField::Bytes
size_t Bytes() const
Definition: clover_field.h:167

quda::CloverField::length
size_t length
Definition: clover_field.h:111

quda::ColorSpinorField
Definition: color_spinor_field.h:379

quda::ColorSpinorField::Create
static ColorSpinorField * Create(const ColorSpinorParam &param)
Definition: color_spinor_field.cpp:714

quda::ColorSpinorParam
Definition: color_spinor_field.h:131

quda::ColorSpinorParam::gammaBasis
QudaGammaBasis gammaBasis
Definition: color_spinor_field.h:145

quda::ColorSpinorParam::nColor
int nColor
Definition: color_spinor_field.h:136

quda::ColorSpinorParam::location
QudaFieldLocation location
Definition: color_spinor_field.h:134

quda::ColorSpinorParam::setPrecision
void setPrecision(QudaPrecision precision, QudaPrecision ghost_precision=QUDA_INVALID_PRECISION, bool force_native=false)
Definition: color_spinor_field.h:172

quda::ColorSpinorParam::fieldOrder
QudaFieldOrder fieldOrder
Definition: color_spinor_field.h:144

quda::ColorSpinorParam::siteOrder
QudaSiteOrder siteOrder
Definition: color_spinor_field.h:142

quda::ColorSpinorParam::nSpin
int nSpin
Definition: color_spinor_field.h:137

quda::ColorSpinorParam::create
QudaFieldCreate create
Definition: color_spinor_field.h:146

quda::ColorSpinorParam::v
void * v
Definition: color_spinor_field.h:156

quda::LatticeField
Definition: lattice_field.h:145

quda::LatticeField::stride
size_t stride
Definition: lattice_field.h:160

quda::LatticeField::nDim
int nDim
Definition: lattice_field.h:166

quda::LatticeField::Pad
int Pad() const
Definition: lattice_field.h:552

quda::LatticeField::Precision
QudaPrecision Precision() const
Definition: lattice_field.h:567

quda::LatticeField::Location
QudaFieldLocation Location() const
Definition: lattice_field.cpp:683

quda::LatticeField::precision
QudaPrecision precision
Definition: lattice_field.h:178

quda::LatticeField::volumeCB
size_t volumeCB
Definition: lattice_field.h:152

quda::LatticeField::X
const int * X() const
Definition: lattice_field.h:505

quda::LatticeField::checkField
void checkField(const LatticeField &a) const
Definition: lattice_field.cpp:653

quda::LatticeField::Ndim
int Ndim() const
Definition: lattice_field.h:500

quda::LatticeField::total_bytes
size_t total_bytes
Definition: lattice_field.h:163

quda::cpuCloverField
Definition: clover_field.h:332

quda::cpuCloverField::~cpuCloverField
virtual ~cpuCloverField()
Definition: clover_field.cpp:394

quda::cpuCloverField::copy_to_buffer
virtual void copy_to_buffer(void *buffer) const
Copy all contents of the field to a host buffer.
Definition: clover_field.cpp:404

quda::cpuCloverField::cpuCloverField
cpuCloverField(const CloverFieldParam &param)
Definition: clover_field.cpp:365

quda::cpuCloverField::copy_from_buffer
virtual void copy_from_buffer(void *buffer)
Copy all contents of the field from a host buffer to this field.
Definition: clover_field.cpp:422

quda::cudaCloverField
Definition: clover_field.h:253

quda::cudaCloverField::copy
void copy(const CloverField &src, bool inverse=true)
Copy into this CloverField from the generic CloverField src.
Definition: clover_field.cpp:174

quda::cudaCloverField::loadCPUField
void loadCPUField(const cpuCloverField &cpu)
Definition: clover_field.cpp:232

quda::cudaCloverField::cudaCloverField
cudaCloverField(const CloverFieldParam &param)
Definition: clover_field.cpp:85

quda::cudaCloverField::copy_from_buffer
virtual void copy_from_buffer(void *buffer)
Copy all contents of the field from a host buffer to this field.
Definition: clover_field.cpp:287

quda::cudaCloverField::saveCPUField
void saveCPUField(cpuCloverField &cpu) const
Definition: clover_field.cpp:234

quda::cudaCloverField::copy_to_buffer
virtual void copy_to_buffer(void *buffer) const
Copy all contents of the field to a host buffer.
Definition: clover_field.cpp:267

quda::cudaCloverField::~cudaCloverField
virtual ~cudaCloverField()
Definition: clover_field.cpp:162

quda::cudaCloverField::prefetch
void prefetch(QudaFieldLocation mem_space, qudaStream_t stream=0) const
If managed memory and prefetch is enabled, prefetch the clover, the norm field (as appropriate),...
Definition: clover_field.cpp:307

quda::cudaGaugeField
Definition: gauge_field.h:449

clover_field.h

color_spinor_field.h

V
int V
Definition: host_utils.cpp:37

memset
void * memset(void *s, int c, size_t n)

parity
QudaParity parity
Definition: covdev_test.cpp:40

nColor
const int nColor
Definition: covdev_test.cpp:44

QUDA_QDPJIT_CLOVER_ORDER
@ QUDA_QDPJIT_CLOVER_ORDER
Definition: enum_quda.h:259

QUDA_PACKED_CLOVER_ORDER
@ QUDA_PACKED_CLOVER_ORDER
Definition: enum_quda.h:258

QUDA_CUDA_FIELD_LOCATION
@ QUDA_CUDA_FIELD_LOCATION
Definition: enum_quda.h:326

QUDA_CPU_FIELD_LOCATION
@ QUDA_CPU_FIELD_LOCATION
Definition: enum_quda.h:325

QUDA_FULL_SITE_SUBSET
@ QUDA_FULL_SITE_SUBSET
Definition: enum_quda.h:333

QUDA_UKQCD_GAMMA_BASIS
@ QUDA_UKQCD_GAMMA_BASIS
Definition: enum_quda.h:369

QUDA_EVEN_PARITY
@ QUDA_EVEN_PARITY
Definition: enum_quda.h:284

QUDA_INVALID_PARITY
@ QUDA_INVALID_PARITY
Definition: enum_quda.h:284

QudaFieldLocation
enum QudaFieldLocation_s QudaFieldLocation

QUDA_EVEN_ODD_SITE_ORDER
@ QUDA_EVEN_ODD_SITE_ORDER
Definition: enum_quda.h:340

QUDA_DOUBLE_PRECISION
@ QUDA_DOUBLE_PRECISION
Definition: enum_quda.h:65

QUDA_SINGLE_PRECISION
@ QUDA_SINGLE_PRECISION
Definition: enum_quda.h:64

QUDA_QUARTER_PRECISION
@ QUDA_QUARTER_PRECISION
Definition: enum_quda.h:62

QUDA_HALF_PRECISION
@ QUDA_HALF_PRECISION
Definition: enum_quda.h:63

QUDA_FLOAT2_FIELD_ORDER
@ QUDA_FLOAT2_FIELD_ORDER
Definition: enum_quda.h:348

QUDA_FLOAT4_FIELD_ORDER
@ QUDA_FLOAT4_FIELD_ORDER
Definition: enum_quda.h:349

QUDA_ZERO_FIELD_CREATE
@ QUDA_ZERO_FIELD_CREATE
Definition: enum_quda.h:361

QUDA_REFERENCE_FIELD_CREATE
@ QUDA_REFERENCE_FIELD_CREATE
Definition: enum_quda.h:363

QUDA_NULL_FIELD_CREATE
@ QUDA_NULL_FIELD_CREATE
Definition: enum_quda.h:360

QudaParity
enum QudaParity_s QudaParity

gauge_field.h

pool_pinned_malloc
#define pool_pinned_malloc(size)
Definition: malloc_quda.h:172

pool_device_malloc
#define pool_device_malloc(size)
Definition: malloc_quda.h:170

safe_malloc
#define safe_malloc(size)
Definition: malloc_quda.h:106

pool_pinned_free
#define pool_pinned_free(ptr)
Definition: malloc_quda.h:173

pool_device_free
#define pool_device_free(ptr)
Definition: malloc_quda.h:171

host_free
#define host_free(ptr)
Definition: malloc_quda.h:115

quda::blas::norm1
double norm1(const ColorSpinorField &b)

quda::blas::bytes
unsigned long long bytes

quda::blas::norm2
double norm2(const ColorSpinorField &a)

quda
Definition: blas_lapack.h:24

quda::colorSpinorParam
ColorSpinorParam colorSpinorParam(const CloverField &a, bool inverse)
Definition: clover_field.cpp:460

quda::norm2
double norm2(const CloverField &a, bool inverse=false)
Definition: clover_field.cpp:485

quda::inverse
__device__ __host__ Matrix< T, 3 > inverse(const Matrix< T, 3 > &u)
Definition: quda_matrix.h:605

quda::copyGenericClover
void copyGenericClover(CloverField &out, const CloverField &in, bool inverse, QudaFieldLocation location, void *Out=0, void *In=0, void *outNorm=0, void *inNorm=0)
This generic function is used for copying the clover field where in the input and output can be in an...

quda::stream
qudaStream_t * stream
Definition: cuda_color_spinor_field.cpp:644

quda::norm1
double norm1(const CloverField &u, bool inverse=false)
Definition: clover_field.cpp:493

quda::computeClover
void computeClover(CloverField &clover, const GaugeField &fmunu, double coeff)
Driver for computing the clover field from the field strength tensor.

quda::CloverPrefetchType
CloverPrefetchType
Definition: clover_field.h:28

quda::CloverPrefetchType::BOTH_CLOVER_PREFETCH_TYPE
@ BOTH_CLOVER_PREFETCH_TYPE

quda::CloverPrefetchType::INVERSE_CLOVER_PREFETCH_TYPE
@ INVERSE_CLOVER_PREFETCH_TYPE

quda::CloverPrefetchType::CLOVER_CLOVER_PREFETCH_TYPE
@ CLOVER_CLOVER_PREFETCH_TYPE

quda::reorder_location
QudaFieldLocation reorder_location()
Return whether data is reordered on the CPU or GPU. This can be set at QUDA initialization using the env...
Definition: lattice_field.cpp:748

quda::norm
__host__ __device__ ValueType norm(const complex< ValueType > &z)
Returns the magnitude of z squared.
Definition: complex_quda.h:1088

quda::is_prefetch_enabled
bool is_prefetch_enabled()
Definition: malloc.cpp:198

quda::operator<<
std::ostream & operator<<(std::ostream &output, const CloverFieldParam &param)
Definition: clover_field.cpp:441

param
QudaGaugeParam param
Definition: pack_test.cpp:18

qudaMemPrefetchAsync
#define qudaMemPrefetchAsync(ptr, count, mem_space, stream)
Definition: quda_api.h:231

qudaMemcpy
#define qudaMemcpy(dst, src, count, kind)
Definition: quda_api.h:204

qudaStream_t
cudaStream_t qudaStream_t
Definition: quda_api.h:9

qudaDeviceSynchronize
#define qudaDeviceSynchronize()
Definition: quda_api.h:250

quda_internal.h

ALIGNMENT_ADJUST
#define ALIGNMENT_ADJUST(n)
Definition: quda_internal.h:42

QudaGaugeParam_s::location
QudaFieldLocation location
Definition: quda.h:33

quda::CloverFieldParam
Definition: clover_field.h:35

quda::CloverFieldParam::CloverFieldParam
CloverFieldParam()
Definition: clover_field.h:71

quda::LatticeFieldParam
Definition: lattice_field.h:48

quda::LatticeFieldParam::pad
int pad
Definition: lattice_field.h:70

quda::LatticeFieldParam::precision
QudaPrecision precision
Definition: lattice_field.h:52

quda::LatticeFieldParam::nDim
int nDim
Definition: lattice_field.h:65

quda::LatticeFieldParam::x
int x[QUDA_MAX_DIM]
Definition: lattice_field.h:68

quda::LatticeFieldParam::siteSubset
QudaSiteSubset siteSubset
Definition: lattice_field.h:72

errorQuda
#define errorQuda(...)
Definition: util_quda.h:120