QUDA  v1.1.0
A library for QCD on GPUs
cpu_gauge_field.cpp
#include <quda_internal.h>
#include <gauge_field.h>
#include <assert.h>
#include <string.h>
#include <typeinfo>

namespace quda {

  cpuGaugeField::cpuGaugeField(const GaugeFieldParam &param) : GaugeField(param)
  {
    if (precision == QUDA_HALF_PRECISION) {
      errorQuda("CPU fields do not support half precision");
    }
    if (precision == QUDA_QUARTER_PRECISION) {
      errorQuda("CPU fields do not support quarter precision");
    }
    if (pad != 0) {
      errorQuda("CPU fields do not support non-zero padding");
    }
    if (reconstruct != QUDA_RECONSTRUCT_NO && reconstruct != QUDA_RECONSTRUCT_10) {
      errorQuda("Reconstruction type %d not supported", reconstruct);
    }
    if (reconstruct == QUDA_RECONSTRUCT_10 && link_type != QUDA_ASQTAD_MOM_LINKS) {
      errorQuda("10-reconstruction only supported with momentum links");
    }

    int siteDim = 0;
    if (geometry == QUDA_SCALAR_GEOMETRY) siteDim = 1;
    else if (geometry == QUDA_VECTOR_GEOMETRY) siteDim = nDim;
    else if (geometry == QUDA_TENSOR_GEOMETRY) siteDim = nDim * (nDim-1) / 2;
    else if (geometry == QUDA_COARSE_GEOMETRY) siteDim = 2*nDim;
    else errorQuda("Unknown geometry type %d", geometry);

    // compute the correct bytes size for these padded field orders
    if (order == QUDA_TIFR_PADDED_GAUGE_ORDER) {
      bytes = siteDim * (x[0]*x[1]*(x[2]+4)*x[3]) * nInternal * precision;
    } else if (order == QUDA_BQCD_GAUGE_ORDER) {
      bytes = siteDim * (x[0]+4)*(x[1]+2)*(x[2]+2)*(x[3]+2) * nInternal * precision;
    } else if (order == QUDA_MILC_SITE_GAUGE_ORDER) {
      bytes = volume * param.site_size;
    }

    if (order == QUDA_QDP_GAUGE_ORDER) {
      gauge = (void **)safe_malloc(siteDim * sizeof(void *));

      for (int d = 0; d < siteDim; d++) {
        size_t nbytes = volume * nInternal * precision;
        if (create == QUDA_NULL_FIELD_CREATE || create == QUDA_ZERO_FIELD_CREATE) {
          gauge[d] = nbytes ? safe_malloc(nbytes) : nullptr;
          if (create == QUDA_ZERO_FIELD_CREATE && nbytes) memset(gauge[d], 0, nbytes);
        } else if (create == QUDA_REFERENCE_FIELD_CREATE) {
          gauge[d] = ((void **)param.gauge)[d];
        } else {
          errorQuda("Unsupported creation type %d", create);
        }
      }

    } else if (order == QUDA_CPS_WILSON_GAUGE_ORDER || order == QUDA_MILC_GAUGE_ORDER ||
               order == QUDA_MILC_SITE_GAUGE_ORDER || order == QUDA_BQCD_GAUGE_ORDER ||
               order == QUDA_TIFR_GAUGE_ORDER || order == QUDA_TIFR_PADDED_GAUGE_ORDER) {

      if (order == QUDA_MILC_SITE_GAUGE_ORDER && create != QUDA_REFERENCE_FIELD_CREATE) {
        errorQuda("MILC site gauge order only supported for reference fields");
      }

      if (create == QUDA_NULL_FIELD_CREATE || create == QUDA_ZERO_FIELD_CREATE) {
        gauge = bytes ? (void **)safe_malloc(bytes) : nullptr;
        if (create == QUDA_ZERO_FIELD_CREATE && bytes) memset(gauge, 0, bytes);
      } else if (create == QUDA_REFERENCE_FIELD_CREATE) {
        gauge = (void **)param.gauge;
      } else {
        errorQuda("Unsupported creation type %d", create);
      }

    } else {
      errorQuda("Unsupported gauge order type %d", order);
    }

    // no need to exchange data if this is a momentum field
    if (link_type != QUDA_ASQTAD_MOM_LINKS && ghostExchange == QUDA_GHOST_EXCHANGE_PAD) {
      // Ghost zone is always 2-dimensional
      for (int i = 0; i < nDim; i++) {
        size_t nbytes = nFace * surface[i] * nInternal * precision;
        ghost[i] = nbytes ? safe_malloc(nbytes) : nullptr;
        ghost[i+4] = (nbytes && geometry == QUDA_COARSE_GEOMETRY) ? safe_malloc(nbytes) : nullptr;
      }

      if (create == QUDA_REFERENCE_FIELD_CREATE) {
        // exchange the boundaries if a non-trivial field
        if (geometry == QUDA_VECTOR_GEOMETRY || geometry == QUDA_COARSE_GEOMETRY)
          exchangeGhost(geometry == QUDA_VECTOR_GEOMETRY ? QUDA_LINK_BACKWARDS : QUDA_LINK_BIDIRECTIONAL);
      }
    }

    // compute the fat link max now in case it is needed later (i.e., for half precision)
    if (param.compute_fat_link_max) fat_link_max = this->abs_max();
  }

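  /* Usage sketch (illustrative only, not part of this file): wrapping
     existing host gauge links in a cpuGaugeField without copying them.
     Assumes `gp` is a GaugeFieldParam already populated elsewhere with
     the lattice dimensions, precision and link type; the members
     gp.order, gp.create and gp.gauge are assumptions based on the
     fields the constructor reads above.

       void *links[4];                             // one link array per dimension
       // ... fill links[d] with host data ...
       gp.order  = QUDA_QDP_GAUGE_ORDER;           // array-of-pointers layout handled above
       gp.create = QUDA_REFERENCE_FIELD_CREATE;    // alias the host pointers, no allocation
       gp.gauge  = (void *)links;
       cpuGaugeField cpu_gauge(gp);                // ghost buffers are still allocated here
  */
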
  cpuGaugeField::~cpuGaugeField()
  {
    int siteDim = 0;
    if (geometry == QUDA_SCALAR_GEOMETRY) siteDim = 1;
    else if (geometry == QUDA_VECTOR_GEOMETRY) siteDim = nDim;
    else if (geometry == QUDA_TENSOR_GEOMETRY) siteDim = nDim * (nDim-1) / 2;
    else if (geometry == QUDA_COARSE_GEOMETRY) siteDim = 2*nDim;
    else errorQuda("Unknown geometry type %d", geometry);

    if (create == QUDA_NULL_FIELD_CREATE || create == QUDA_ZERO_FIELD_CREATE) {
      if (order == QUDA_QDP_GAUGE_ORDER) {
        for (int d = 0; d < siteDim; d++) {
          if (gauge[d]) host_free(gauge[d]);
        }
        if (gauge) host_free(gauge);
      } else {
        if (gauge) host_free(gauge);
      }
    } else { // QUDA_REFERENCE_FIELD_CREATE
      if (order == QUDA_QDP_GAUGE_ORDER) {
        if (gauge) host_free(gauge);
      }
    }

    if (link_type != QUDA_ASQTAD_MOM_LINKS && ghostExchange == QUDA_GHOST_EXCHANGE_PAD) {
      for (int i = 0; i < nDim; i++) {
        if (ghost[i]) host_free(ghost[i]);
        if (ghost[i+4] && geometry == QUDA_COARSE_GEOMETRY) host_free(ghost[i+4]);
      }
    }
  }

  // This does the exchange of the gauge field ghost zone and places it
  // into the ghost array.
  void cpuGaugeField::exchangeGhost(QudaLinkDirection link_direction) {
    if (geometry != QUDA_VECTOR_GEOMETRY && geometry != QUDA_COARSE_GEOMETRY)
      errorQuda("Cannot exchange for %d geometry gauge field", geometry);

    if ((link_direction == QUDA_LINK_BIDIRECTIONAL || link_direction == QUDA_LINK_FORWARDS) && geometry != QUDA_COARSE_GEOMETRY)
      errorQuda("Cannot request exchange of forward links on non-coarse geometry");

    void *send[2*QUDA_MAX_DIM];
    for (int d = 0; d < nDim; d++) {
      send[d] = safe_malloc(nFace * surface[d] * nInternal * precision);
      if (geometry == QUDA_COARSE_GEOMETRY) send[d + nDim] = safe_malloc(nFace * surface[d] * nInternal * precision);
    }

    if (link_direction == QUDA_LINK_BACKWARDS || link_direction == QUDA_LINK_BIDIRECTIONAL) {
      // get the links into contiguous buffers
      extractGaugeGhost(*this, send, true);

      // communicate between nodes
      exchange(ghost, send, QUDA_FORWARDS);
    }

    // repeat if requested and links are bi-directional
    if (link_direction == QUDA_LINK_FORWARDS || link_direction == QUDA_LINK_BIDIRECTIONAL) {
      extractGaugeGhost(*this, send, true, nDim);
      exchange(ghost + nDim, send + nDim, QUDA_FORWARDS);
    }

    for (int d = 0; d < geometry; d++) host_free(send[d]);
  }

  // This does the opposite of exchangeGhost and sends back the ghost
  // zone to the node from which it came and injects it back into the
  // field
  void cpuGaugeField::injectGhost(QudaLinkDirection link_direction) {
    if (geometry != QUDA_VECTOR_GEOMETRY && geometry != QUDA_COARSE_GEOMETRY)
      errorQuda("Cannot exchange for %d geometry gauge field", geometry);

    if (link_direction != QUDA_LINK_BACKWARDS)
      errorQuda("link_direction = %d not supported", link_direction);

    void *recv[2*QUDA_MAX_DIM];
    for (int d = 0; d < nDim; d++) recv[d] = safe_malloc(nFace * surface[d] * nInternal * precision);

    // communicate between nodes
    exchange(recv, ghost, QUDA_BACKWARDS);

    // inject the received links back into the field
    extractGaugeGhost(*this, recv, false);

    for (int d = 0; d < nDim; d++) host_free(recv[d]);
  }
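
  /* Usage sketch (illustrative only): the two halo routines above are
     complementary.  exchangeGhost() gathers the boundary links of the
     neighbouring rank into this->ghost[], while injectGhost() sends this
     rank's ghost[] contents back and folds them into the local field.
     Each dimension-d buffer holds nFace * surface[d] * nInternal * precision
     bytes, matching the allocations above.

       cpu_gauge.exchangeGhost(QUDA_LINK_BACKWARDS);  // populate ghost[] from neighbours
       // ... use or modify the ghost links ...
       cpu_gauge.injectGhost(QUDA_LINK_BACKWARDS);    // push ghost[] back where it came from
  */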

  void cpuGaugeField::exchangeExtendedGhost(const int *R, bool no_comms_fill) {

    void *send[QUDA_MAX_DIM];
    void *recv[QUDA_MAX_DIM];
    size_t bytes[QUDA_MAX_DIM];
    // store both parities and directions in each
    for (int d = 0; d < nDim; d++) {
      if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d]))) continue;
      bytes[d] = surface[d] * R[d] * geometry * nInternal * precision;
      send[d] = safe_malloc(2 * bytes[d]);
      recv[d] = safe_malloc(2 * bytes[d]);
    }

    for (int d = 0; d < nDim; d++) {
      if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d]))) continue;
      // extract into a contiguous buffer
      extractExtendedGaugeGhost(*this, d, R, send, true);

      if (comm_dim_partitioned(d)) {
        // do the exchange
        MsgHandle *mh_recv_back;
        MsgHandle *mh_recv_fwd;
        MsgHandle *mh_send_fwd;
        MsgHandle *mh_send_back;

        mh_recv_back = comm_declare_receive_relative(recv[d], d, -1, bytes[d]);
        mh_recv_fwd = comm_declare_receive_relative(((char*)recv[d])+bytes[d], d, +1, bytes[d]);
        mh_send_back = comm_declare_send_relative(send[d], d, -1, bytes[d]);
        mh_send_fwd = comm_declare_send_relative(((char*)send[d])+bytes[d], d, +1, bytes[d]);

        comm_start(mh_recv_back);
        comm_start(mh_recv_fwd);
        comm_start(mh_send_fwd);
        comm_start(mh_send_back);

        comm_wait(mh_send_fwd);
        comm_wait(mh_send_back);
        comm_wait(mh_recv_back);
        comm_wait(mh_recv_fwd);

        comm_free(mh_send_fwd);
        comm_free(mh_send_back);
        comm_free(mh_recv_back);
        comm_free(mh_recv_fwd);

      } else {
        memcpy(static_cast<char*>(recv[d])+bytes[d], send[d], bytes[d]);
        memcpy(recv[d], static_cast<char*>(send[d])+bytes[d], bytes[d]);
      }

      // inject back into the gauge field
      extractExtendedGaugeGhost(*this, d, R, recv, false);
    }

    for (int d = 0; d < nDim; d++) {
      if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d]))) continue;
      host_free(send[d]);
      host_free(recv[d]);
    }

  }

  void cpuGaugeField::exchangeExtendedGhost(const int *R, TimeProfile &profile, bool no_comms_fill) {
    profile.TPSTART(QUDA_PROFILE_COMMS);
    exchangeExtendedGhost(R, no_comms_fill);
    profile.TPSTOP(QUDA_PROFILE_COMMS);
  }
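
  /* Usage sketch (illustrative only): populating the border of an
     extended field.  R[d] gives the halo depth in dimension d, and
     no_comms_fill=true also fills borders of dimensions that are not
     partitioned across ranks.  The profiled overload simply wraps the
     exchange in the QUDA_PROFILE_COMMS timer.

       int R[4] = {2, 2, 2, 2};          // two-site halo in each direction
       extended_gauge.exchangeExtendedGhost(R, true);
       // or, with timing:
       extended_gauge.exchangeExtendedGhost(R, profile, true);
  */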

  // defined in cudaGaugeField
  void *create_gauge_buffer(size_t bytes, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
  void **create_ghost_buffer(size_t bytes[], QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
  void free_gauge_buffer(void *buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
  void free_ghost_buffer(void **buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);

  void cpuGaugeField::copy(const GaugeField &src) {
    if (this == &src) return;

    checkField(src);

    if (link_type == QUDA_ASQTAD_FAT_LINKS) {
      fat_link_max = src.LinkMax();
    } else {
      fat_link_max = 1.0;
    }

    if (typeid(src) == typeid(cudaGaugeField)) {

      if (reorder_location() == QUDA_CPU_FIELD_LOCATION) {

        if (!src.isNative()) errorQuda("Only native order is supported");
        void *buffer = pool_pinned_malloc(src.Bytes());
        // this copies over both even and odd
        qudaMemcpy(buffer, static_cast<const cudaGaugeField&>(src).Gauge_p(),
                   src.Bytes(), cudaMemcpyDeviceToHost);

        copyGenericGauge(*this, src, QUDA_CPU_FIELD_LOCATION, gauge, buffer);
        pool_pinned_free(buffer);

      } else { // else reorder on the GPU

        void *buffer = create_gauge_buffer(bytes, order, geometry);
        size_t ghost_bytes[8];
        int dstNinternal = reconstruct != QUDA_RECONSTRUCT_NO ? reconstruct : 2*nColor*nColor;
        for (int d = 0; d < geometry; d++) ghost_bytes[d] = nFace * surface[d%4] * dstNinternal * precision;
        void **ghost_buffer = (nFace > 0) ? create_ghost_buffer(ghost_bytes, order, geometry) : nullptr;

        if (src.GhostExchange() != QUDA_GHOST_EXCHANGE_EXTENDED) {
          copyGenericGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0, ghost_buffer, 0);
          if (geometry == QUDA_COARSE_GEOMETRY) copyGenericGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0, ghost_buffer, 0, 3); // forwards links if bi-directional
        } else {
          copyExtendedGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0);
        }

        if (order == QUDA_QDP_GAUGE_ORDER) {
          for (int d = 0; d < geometry; d++) {
            qudaMemcpy(((void**)gauge)[d], ((void**)buffer)[d], bytes/geometry, cudaMemcpyDeviceToHost);
          }
        } else {
          // copy from the device staging buffer back into the host field
          qudaMemcpy(gauge, buffer, bytes, cudaMemcpyDeviceToHost);
        }

        if (nFace > 0)
          for (int d = 0; d < geometry; d++)
            qudaMemcpy(Ghost()[d], ghost_buffer[d], ghost_bytes[d], cudaMemcpyDeviceToHost);

        free_gauge_buffer(buffer, order, geometry);
        if (nFace > 0) free_ghost_buffer(ghost_buffer, order, geometry);
      }

    } else if (typeid(src) == typeid(cpuGaugeField)) {
      // copy field and ghost zone directly
      copyGenericGauge(*this, src, QUDA_CPU_FIELD_LOCATION, gauge,
                       const_cast<void*>(static_cast<const cpuGaugeField&>(src).Gauge_p()));
    } else {
      errorQuda("Invalid gauge field type");
    }

    // if we have copied from a source without a pad then we need to exchange
    if (ghostExchange == QUDA_GHOST_EXCHANGE_PAD && src.GhostExchange() != QUDA_GHOST_EXCHANGE_PAD) {
      exchangeGhost(geometry == QUDA_VECTOR_GEOMETRY ? QUDA_LINK_BACKWARDS : QUDA_LINK_BIDIRECTIONAL);
    }
  }
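
  /* Usage sketch (illustrative only): pulling a device-resident field
     back to the host.  copy() reorders either on the CPU (through a
     pinned staging buffer) or on the GPU (through a device staging
     buffer), as selected by reorder_location() above.

       cudaGaugeField device_gauge(device_param);   // assumed to exist already
       // ... evolve / smear the links on the GPU ...
       cpu_gauge.copy(device_gauge);                // reorder + transfer back to the host layout
  */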

  void cpuGaugeField::setGauge(void **gauge_)
  {
    if (create != QUDA_REFERENCE_FIELD_CREATE) {
      errorQuda("Setting gauge pointer is only allowed when create="
                "QUDA_REFERENCE_FIELD_CREATE type\n");
    }
    gauge = gauge_;
  }

  void cpuGaugeField::backup() const {
    if (backed_up) errorQuda("Gauge field already backed up");

    if (order == QUDA_QDP_GAUGE_ORDER) {
      char **buffer = new char*[geometry];
      for (int d = 0; d < geometry; d++) {
        buffer[d] = new char[bytes/geometry];
        memcpy(buffer[d], gauge[d], bytes/geometry);
      }
      backup_h = reinterpret_cast<char*>(buffer);
    } else {
      backup_h = new char[bytes];
      memcpy(backup_h, gauge, bytes);
    }

    backed_up = true;
  }

  void cpuGaugeField::restore() const
  {
    if (!backed_up) errorQuda("Cannot restore since not backed up");

    if (order == QUDA_QDP_GAUGE_ORDER) {
      char **buffer = reinterpret_cast<char**>(backup_h);
      for (int d = 0; d < geometry; d++) {
        memcpy(gauge[d], buffer[d], bytes/geometry);
        delete []buffer[d];
      }
      delete []buffer;
    } else {
      memcpy(gauge, backup_h, bytes);
      delete []backup_h;
    }

    backed_up = false;
  }
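
  /* Usage sketch (illustrative only): backup()/restore() provide a simple
     host-side checkpoint of the link data, e.g. around a trial update that
     may be rejected.  backup() refuses to run twice and restore() refuses
     to run without a prior backup, as enforced above.

       cpu_gauge.backup();     // snapshot the current links into backup_h
       // ... apply a trial modification to the links ...
       cpu_gauge.restore();    // roll the links back to the snapshot
  */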

  void cpuGaugeField::zero() {
    if (order != QUDA_QDP_GAUGE_ORDER) {
      memset(gauge, 0, bytes);
    } else {
      for (int g = 0; g < geometry; g++) memset(gauge[g], 0, volume * nInternal * precision);
    }
  }

  void cpuGaugeField::copy_to_buffer(void *buffer) const
  {
    if (Order() == QUDA_QDP_GAUGE_ORDER || Order() == QUDA_QDPJIT_GAUGE_ORDER) {
      void *const *p = static_cast<void *const *>(Gauge_p());
      int dbytes = Bytes() / 4;
      static_assert(sizeof(char) == 1, "Assuming sizeof(char) == 1");
      char *dst_buffer = reinterpret_cast<char *>(buffer);
      for (int d = 0; d < 4; d++) { std::memcpy(&dst_buffer[d * dbytes], p[d], dbytes); }
    } else if (Order() == QUDA_CPS_WILSON_GAUGE_ORDER || Order() == QUDA_MILC_GAUGE_ORDER
               || Order() == QUDA_MILC_SITE_GAUGE_ORDER || Order() == QUDA_BQCD_GAUGE_ORDER
               || Order() == QUDA_TIFR_GAUGE_ORDER || Order() == QUDA_TIFR_PADDED_GAUGE_ORDER) {
      const void *p = Gauge_p();
      int bytes = Bytes();
      std::memcpy(buffer, p, bytes);
    } else {
      errorQuda("Unsupported order = %d\n", Order());
    }
  }

  void cpuGaugeField::copy_from_buffer(void *buffer)
  {
    if (Order() == QUDA_QDP_GAUGE_ORDER || Order() == QUDA_QDPJIT_GAUGE_ORDER) {
      void **p = static_cast<void **>(Gauge_p());
      size_t dbytes = Bytes() / 4;
      static_assert(sizeof(char) == 1, "Assuming sizeof(char) == 1");
      const char *src_buffer = reinterpret_cast<const char *>(buffer);
      for (int d = 0; d < 4; d++) { std::memcpy(p[d], &src_buffer[d * dbytes], dbytes); }
    } else if (Order() == QUDA_CPS_WILSON_GAUGE_ORDER || Order() == QUDA_MILC_GAUGE_ORDER
               || Order() == QUDA_MILC_SITE_GAUGE_ORDER || Order() == QUDA_BQCD_GAUGE_ORDER
               || Order() == QUDA_TIFR_GAUGE_ORDER || Order() == QUDA_TIFR_PADDED_GAUGE_ORDER) {
      void *p = Gauge_p();
      size_t bytes = Bytes();
      std::memcpy(p, buffer, bytes);
    } else {
      errorQuda("Unsupported order = %d\n", Order());
    }
  }
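
  /* Usage sketch (illustrative only): copy_to_buffer()/copy_from_buffer()
     move the entire field through one contiguous host allocation of
     Bytes() bytes, e.g. to write a configuration to disk and read it back.
     For QDP order the four per-dimension arrays are packed consecutively,
     as in the loops above.

       std::vector<char> archive(cpu_gauge.Bytes());
       cpu_gauge.copy_to_buffer(archive.data());    // serialize
       // ... write archive to disk, or hand it to another field ...
       cpu_gauge.copy_from_buffer(archive.data());  // deserialize
  */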

/*template <typename Float>
void print_matrix(const Float &o, unsigned int x) {

  for (int s=0; s<o.Nspin(); s++) {
    std::cout << "x = " << x << ", s = " << s << ", { ";
    for (int c=0; c<o.Ncolor(); c++) {
      std::cout << " ( " << o(x, s, c, 0) << " , " ;
      if (c<o.Ncolor()-1) std::cout << o(x, s, c, 1) << " ) ," ;
      else std::cout << o(x, s, c, 1) << " ) " ;
    }
    std::cout << " } " << std::endl;
  }

}

// print out the vector at volume point x
void cpuColorSpinorField::PrintMatrix(unsigned int x) {

  switch(precision) {
  case QUDA_DOUBLE_PRECISION:
    print_matrix(*order_double, x);
    break;
  case QUDA_SINGLE_PRECISION:
    print_matrix(*order_single, x);
    break;
  default:
    errorQuda("Precision %d not implemented", precision);
  }

}
*/

} // namespace quda