QUDA  0.9.0
cpu_gauge_field.cpp
Go to the documentation of this file.
1 #include <quda_internal.h>
2 #include <gauge_field.h>
3 #include <assert.h>
4 #include <string.h>
5 #include <typeinfo>
6 
7 namespace quda {
8 
11  {
13  errorQuda("CPU fields do not support half precision");
14  }
15  if (pad != 0) {
16  errorQuda("CPU fields do not support non-zero padding");
17  }
19  errorQuda("Reconstruction type %d not supported", reconstruct);
20  }
22  errorQuda("10-reconstruction only supported with MILC gauge order");
23  }
24 
25  int siteDim=0;
26  if (geometry == QUDA_SCALAR_GEOMETRY) siteDim = 1;
27  else if (geometry == QUDA_VECTOR_GEOMETRY) siteDim = nDim;
28  else if (geometry == QUDA_TENSOR_GEOMETRY) siteDim = nDim * (nDim-1) / 2;
29  else if (geometry == QUDA_COARSE_GEOMETRY) siteDim = 2*nDim;
30  else errorQuda("Unknown geometry type %d", geometry);
31 
32  // compute the correct bytes size for these padded field orders
34  bytes = siteDim * (x[0]*x[1]*(x[2]+4)*x[3]) * nInternal * precision;
35  } else if (order == QUDA_BQCD_GAUGE_ORDER) {
36  bytes = siteDim * (x[0]+4)*(x[1]+2)*(x[2]+2)*(x[3]+2) * nInternal * precision;
37  } else if (order == QUDA_MILC_SITE_GAUGE_ORDER) {
39  }
40 
41  if (order == QUDA_QDP_GAUGE_ORDER) {
42  gauge = (void**) safe_malloc(siteDim * sizeof(void*));
43 
44  for (int d=0; d<siteDim; d++) {
45  size_t nbytes = volume * nInternal * precision;
47  gauge[d] = safe_malloc(nbytes);
48  if (create == QUDA_ZERO_FIELD_CREATE) memset(gauge[d], 0, nbytes);
49  } else if (create == QUDA_REFERENCE_FIELD_CREATE) {
50  gauge[d] = ((void**)param.gauge)[d];
51  } else {
52  errorQuda("Unsupported creation type %d", create);
53  }
54  }
55 
59 
61  errorQuda("MILC site gauge order only supported for reference fields");
62  }
63 
65  gauge = (void **) safe_malloc(bytes);
67  } else if (create == QUDA_REFERENCE_FIELD_CREATE) {
68  gauge = (void**) param.gauge;
69  } else {
70  errorQuda("Unsupported creation type %d", create);
71  }
72 
73  } else {
74  errorQuda("Unsupported gauge order type %d", order);
75  }
76 
77  // no need to exchange data if this is a momentum field
79  // Ghost zone is always 2-dimensional
80  for (int i=0; i<nDim; i++) {
81  size_t nbytes = nFace * surface[i] * nInternal * precision;
82  ghost[i] = nbytes ? safe_malloc(nbytes) : nullptr;
83  ghost[i+4] = (nbytes && geometry == QUDA_COARSE_GEOMETRY) ? safe_malloc(nbytes) : nullptr;
84  }
85 
87  // exchange the boundaries if a non-trivial field
91  }
92  }
93 
94  // compute the fat link max now in case it is needed later (i.e., for half precision)
95  if (param.compute_fat_link_max) fat_link_max = maxGauge(*this);
96  }
97 
98 
100  {
101 
102  int siteDim = 0;
103  if (geometry == QUDA_SCALAR_GEOMETRY) siteDim = 1;
104  else if (geometry == QUDA_VECTOR_GEOMETRY) siteDim = nDim;
105  else if (geometry == QUDA_TENSOR_GEOMETRY) siteDim = nDim * (nDim-1) / 2;
106  else if (geometry == QUDA_COARSE_GEOMETRY) siteDim = 2*nDim;
107  else errorQuda("Unknown geometry type %d", geometry);
108 
110  if (order == QUDA_QDP_GAUGE_ORDER) {
111  for (int d=0; d<siteDim; d++) {
112  if (gauge[d]) host_free(gauge[d]);
113  }
114  if (gauge) host_free(gauge);
115  } else {
116  if (gauge) host_free(gauge);
117  }
118  } else { // QUDA_REFERENCE_FIELD_CREATE
119  if (order == QUDA_QDP_GAUGE_ORDER){
120  if (gauge) host_free(gauge);
121  }
122  }
123 
125  for (int i=0; i<nDim; i++) {
126  if (ghost[i]) host_free(ghost[i]);
128  }
129  }
130  }
131 
132  // This does the exchange of the gauge field ghost zone and places it
133  // into the ghost array.
136  errorQuda("Cannot exchange for %d geometry gauge field", geometry);
137 
138  if ( (link_direction == QUDA_LINK_BIDIRECTIONAL || link_direction == QUDA_LINK_FORWARDS) && geometry != QUDA_COARSE_GEOMETRY)
139  errorQuda("Cannot request exchange of forward links on non-coarse geometry");
140 
141  void *send[2*QUDA_MAX_DIM];
142  for (int d=0; d<nDim; d++) {
145  }
146 
147  if (link_direction == QUDA_LINK_BACKWARDS || link_direction == QUDA_LINK_BIDIRECTIONAL) {
148  // get the links into contiguous buffers
149  extractGaugeGhost(*this, send, true);
150 
151  // communicate between nodes
152  exchange(ghost, send, QUDA_FORWARDS);
153  }
154 
155  // repeat if requested and links are bi-directional
156  if (link_direction == QUDA_LINK_FORWARDS || link_direction == QUDA_LINK_BIDIRECTIONAL) {
157  extractGaugeGhost(*this, send, true, nDim);
159  }
160 
161  for (int d=0; d<geometry; d++) host_free(send[d]);
162  }
163 
164  // This does the opposite of exchangeGhost and sends back the ghost
165  // zone to the node from which it came and injects it back into the
166  // field
169  errorQuda("Cannot exchange for %d geometry gauge field", geometry);
170 
171  if (link_direction != QUDA_LINK_BACKWARDS)
172  errorQuda("link_direction = %d not supported", link_direction);
173 
174  void *recv[QUDA_MAX_DIM];
175  for (int d=0; d<nDim; d++) recv[d] = safe_malloc(nFace*surface[d]*nInternal*precision);
176 
177  // communicate between nodes
178  exchange(recv, ghost, QUDA_BACKWARDS);
179 
180  // get the links into contiguous buffers
181  extractGaugeGhost(*this, recv, false);
182 
183  for (int d=0; d<nDim; d++) host_free(recv[d]);
184  }
185 
186  void cpuGaugeField::exchangeExtendedGhost(const int *R, bool no_comms_fill) {
187 
188  void *send[QUDA_MAX_DIM];
189  void *recv[QUDA_MAX_DIM];
190  size_t bytes[QUDA_MAX_DIM];
191  // store both parities and directions in each
192  for (int d=0; d<nDim; d++) {
193  if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d])) ) continue;
194  bytes[d] = surface[d] * R[d] * geometry * nInternal * precision;
195  send[d] = safe_malloc(2 * bytes[d]);
196  recv[d] = safe_malloc(2 * bytes[d]);
197  }
198 
199  for (int d=0; d<nDim; d++) {
200  if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d])) ) continue;
201  //extract into a contiguous buffer
202  extractExtendedGaugeGhost(*this, d, R, send, true);
203 
204  if (comm_dim_partitioned(d)) {
205  // do the exchange
210 
212  mh_recv_fwd = comm_declare_receive_relative(((char*)recv[d])+bytes[d], d, +1, bytes[d]);
214  mh_send_fwd = comm_declare_send_relative(((char*)send[d])+bytes[d], d, +1, bytes[d]);
215 
220 
225 
230  } else {
231  memcpy(static_cast<char*>(recv[d])+bytes[d], send[d], bytes[d]);
232  memcpy(recv[d], static_cast<char*>(send[d])+bytes[d], bytes[d]);
233  }
234 
235  // inject back into the gauge field
236  extractExtendedGaugeGhost(*this, d, R, recv, false);
237  }
238 
239  for (int d=0; d<nDim; d++) {
240  if (!(comm_dim_partitioned(d) || (no_comms_fill && R[d])) ) continue;
241  host_free(send[d]);
242  host_free(recv[d]);
243  }
244 
245  }
246 
247  void cpuGaugeField::exchangeExtendedGhost(const int *R, TimeProfile &profile, bool no_comms_fill) {
248  profile.TPSTART(QUDA_PROFILE_COMMS);
249  exchangeExtendedGhost(R, no_comms_fill);
250  profile.TPSTOP(QUDA_PROFILE_COMMS);
251  }
252 
253  // defined in cudaGaugeField
254  void *create_gauge_buffer(size_t bytes, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
255  void **create_ghost_buffer(size_t bytes[], QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
256  void free_gauge_buffer(void *buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
257  void free_ghost_buffer(void **buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry);
258 
260  if (this == &src) return;
261 
262  checkField(src);
263 
265  fat_link_max = src.LinkMax();
266  if (precision == QUDA_HALF_PRECISION && fat_link_max == 0.0)
267  errorQuda("fat_link_max has not been computed");
268  } else {
269  fat_link_max = 1.0;
270  }
271 
272  if (typeid(src) == typeid(cudaGaugeField)) {
273 
275 
276  if (!src.isNative()) errorQuda("Only native order is supported");
277  void *buffer = pool_pinned_malloc(src.Bytes());
278  // this copies over both even and odd
279  qudaMemcpy(buffer, static_cast<const cudaGaugeField&>(src).Gauge_p(),
280  src.Bytes(), cudaMemcpyDeviceToHost);
281 
283  pool_pinned_free(buffer);
284 
285  } else { // else on the GPU
286 
287  void *buffer = create_gauge_buffer(bytes, order, geometry);
288  size_t ghost_bytes[8];
289  int dstNinternal = reconstruct != QUDA_RECONSTRUCT_NO ? reconstruct : 2*nColor*nColor;
290  for (int d=0; d<geometry; d++) ghost_bytes[d] = nFace * surface[d%4] * dstNinternal * precision;
291  void **ghost_buffer = (nFace > 0) ? create_ghost_buffer(ghost_bytes, order, geometry) : nullptr;
292 
294  copyGenericGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0, ghost_buffer, 0);
295  if (geometry == QUDA_COARSE_GEOMETRY) copyGenericGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0, ghost_buffer, 0, 3); // forwards links if bi-directional
296  } else {
297  copyExtendedGauge(*this, src, QUDA_CUDA_FIELD_LOCATION, buffer, 0);
298  }
299 
300  if (order == QUDA_QDP_GAUGE_ORDER) {
301  for (int d=0; d<geometry; d++) {
302  qudaMemcpy(((void**)gauge)[d], ((void**)buffer)[d], bytes/geometry, cudaMemcpyDeviceToHost);
303  }
304  } else {
305  qudaMemcpy(gauge, buffer, bytes, cudaMemcpyHostToDevice);
306  }
307 
308  if (order > 4 && ghostExchange == QUDA_GHOST_EXCHANGE_PAD && src.GhostExchange() == QUDA_GHOST_EXCHANGE_PAD && nFace)
309  for (int d=0; d<geometry; d++)
310  qudaMemcpy(Ghost()[d], ghost_buffer[d], ghost_bytes[d], cudaMemcpyDeviceToHost);
311 
312  free_gauge_buffer(buffer, order, geometry);
313  if (nFace > 0) free_ghost_buffer(ghost_buffer, order, geometry);
314  }
315 
316  } else if (typeid(src) == typeid(cpuGaugeField)) {
317  // copy field and ghost zone directly
319  const_cast<void*>(static_cast<const cpuGaugeField&>(src).Gauge_p()));
320  } else {
321  errorQuda("Invalid gauge field type");
322  }
323 
324  // if we have copied from a source without a pad then we need to exchange
326  src.GhostExchange() != QUDA_GHOST_EXCHANGE_PAD) {
328  }
329 
330  checkCudaError();
331  }
332 
// Replace the field's gauge pointer array with a caller-owned one.
// Per the error message below, this is only legal when the field was
// created with QUDA_REFERENCE_FIELD_CREATE (the object owns no allocation).
333  void cpuGaugeField::setGauge(void **gauge_)
334  {
// NOTE(review): source line 335 is absent from this extraction; given the
// message below and the stray `}` on line 338, it is presumably the guard
// `if (create != QUDA_REFERENCE_FIELD_CREATE) {` — confirm against upstream.
336  errorQuda("Setting gauge pointer is only allowed when create="
337  "QUDA_REFERENCE_FIELD_CREATE type\n");
338  }
339  gauge = gauge_;
340  }
341 
// Back up the host gauge field into a freshly allocated buffer (backup_h)
// so it can later be reverted via restore(). Errors if already backed up.
342  void cpuGaugeField::backup() const {
343  if (backed_up) errorQuda("Gauge field already backed up");
344 
// QDP order stores one pointer per geometry component, so each component
// array is copied separately and the pointer table itself is stashed in backup_h.
345  if (order == QUDA_QDP_GAUGE_ORDER) {
346  char **buffer = new char*[geometry];
347  for (int d=0; d<geometry; d++) {
348  buffer[d] = new char[bytes/geometry];
349  memcpy(buffer[d], gauge[d], bytes/geometry);
350  }
351  backup_h = reinterpret_cast<char*>(buffer);
352  } else {
353  backup_h = new char[bytes];
// NOTE(review): source line 354 is missing from this extraction; by symmetry
// with restore() it presumably reads `memcpy(backup_h, gauge, bytes);` —
// confirm against upstream.
355  }
356 
357  backed_up = true;
358  }
359 
361  if (!backed_up) errorQuda("Cannot restore since not backed up");
362 
363  if (order == QUDA_QDP_GAUGE_ORDER) {
364  char **buffer = reinterpret_cast<char**>(backup_h);
365  for (int d=0; d<geometry; d++) {
366  memcpy(gauge[d], buffer[d], bytes/geometry);
367  delete []buffer[d];
368  }
369  delete []buffer;
370  } else {
372  delete []backup_h;
373  }
374 
375  backed_up = false;
376  }
377 
379  memset(gauge, 0, bytes);
380  }
381 
382 /*template <typename Float>
383 void print_matrix(const Float &o, unsigned int x) {
384 
385  for (int s=0; s<o.Nspin(); s++) {
386  std::cout << "x = " << x << ", s = " << s << ", { ";
387  for (int c=0; c<o.Ncolor(); c++) {
388  std::cout << " ( " << o(x, s, c, 0) << " , " ;
389  if (c<o.Ncolor()-1) std::cout << o(x, s, c, 1) << " ) ," ;
390  else std::cout << o(x, s, c, 1) << " ) " ;
391  }
392  std::cout << " } " << std::endl;
393  }
394 
395 }
396 
397 // print out the vector at volume point x
398 void cpuColorSpinorField::PrintMatrix(unsigned int x) {
399 
400  switch(precision) {
401  case QUDA_DOUBLE_PRECISION:
402  print_matrix(*order_double, x);
403  break;
404  case QUDA_SINGLE_PRECISION:
405  print_matrix(*order_single, x);
406  break;
407  default:
408  errorQuda("Precision %d not implemented", precision);
409  }
410 
411 }
412 */
413 
414 } // namespace quda
#define qudaMemcpy(dst, src, count, kind)
Definition: quda_cuda_api.h:32
QudaFieldLocation reorder_location()
Return whether data is reordered on the CPU or GPU. This can set at QUDA initialization using the env...
void extractGaugeGhost(const GaugeField &u, void **ghost, bool extract=true, int offset=0)
void setGauge(void **_gauge)
double maxGauge(const GaugeField &u)
Definition: max_gauge.cu:31
#define pool_pinned_free(ptr)
Definition: malloc_quda.h:116
void copyGenericGauge(GaugeField &out, const GaugeField &in, QudaFieldLocation location, void *Out=0, void *In=0, void **ghostOut=0, void **ghostIn=0, int type=0)
Definition: copy_gauge.cu:38
const void * src
void exchangeExtendedGhost(const int *R, bool no_comms_fill=false)
This does routine will populate the border / halo region of a gauge field that has been created using...
#define errorQuda(...)
Definition: util_quda.h:90
void free_gauge_buffer(void *buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry)
#define host_free(ptr)
Definition: malloc_quda.h:59
enum QudaLinkDirection_s QudaLinkDirection
void free_ghost_buffer(void **buffer, QudaGaugeFieldOrder order, QudaFieldGeometry geometry)
QudaReconstructType reconstruct
Definition: gauge_field.h:135
int x[QUDA_MAX_DIM]
static int R[4]
QudaFieldGeometry geometry
Definition: gauge_field.h:133
QudaGaugeParam param
Definition: pack_test.cpp:17
void comm_free(MsgHandle *mh)
Definition: comm_mpi.cpp:252
const int * R() const
void checkField(const LatticeField &) const
#define comm_declare_send_relative(buffer, dim, dir, nbytes)
Definition: comm_quda.h:59
#define comm_declare_receive_relative(buffer, dim, dir, nbytes)
Definition: comm_quda.h:74
MsgHandle * mh_recv_back[2][QUDA_MAX_DIM]
void copy(const GaugeField &src)
void extractExtendedGaugeGhost(const GaugeField &u, int dim, const int *R, void **ghost, bool extract)
void comm_start(MsgHandle *mh)
Definition: comm_mpi.cpp:260
QudaGhostExchange ghostExchange
void exchange(void **recv, void **send, QudaDirection dir) const
Exchange the buffers across all dimensions in a given direction.
void * create_gauge_buffer(size_t bytes, QudaGaugeFieldOrder order, QudaFieldGeometry geometry)
void restore()
Restores the cpuGaugeField.
const void ** Ghost() const
Definition: gauge_field.h:254
enum QudaGaugeFieldOrder_s QudaGaugeFieldOrder
void injectGhost(QudaLinkDirection link_direction=QUDA_LINK_BACKWARDS)
The opposite of exchangeGhost: take the ghost zone on x, send to node x-1, and inject back into the f...
void * memcpy(void *__dst, const void *__src, size_t __n)
#define safe_malloc(size)
Definition: malloc_quda.h:54
MsgHandle * mh_send_fwd[2][QUDA_MAX_DIM]
cpuGaugeField(const GaugeFieldParam &param)
Constructor for cpuGaugeField from a GaugeFieldParam.
void * memset(void *__b, int __c, size_t __len)
int surface[QUDA_MAX_DIM]
#define pool_pinned_malloc(size)
Definition: malloc_quda.h:115
void backup() const
Backs up the cpuGaugeField.
void exchangeGhost(QudaLinkDirection link_direction=QUDA_LINK_BACKWARDS)
Exchange the ghost and store store in the padded region.
void ** create_ghost_buffer(size_t bytes[], QudaGaugeFieldOrder order, QudaFieldGeometry geometry)
QudaLinkType link_type
Definition: gauge_field.h:139
QudaFieldCreate create
Definition: gauge_field.h:147
enum QudaFieldGeometry_s QudaFieldGeometry
#define QUDA_MAX_DIM
Maximum number of dimensions supported by QUDA. In practice, no routines make use of more than 5...
#define checkCudaError()
Definition: util_quda.h:129
MsgHandle * mh_recv_fwd[2][QUDA_MAX_DIM]
void comm_wait(MsgHandle *mh)
Definition: comm_mpi.cpp:266
QudaGaugeFieldOrder order
Definition: gauge_field.h:137
static __inline__ size_t size_t d
void * ghost[2 *QUDA_MAX_DIM]
Definition: gauge_field.h:149
QudaPrecision precision
MsgHandle * mh_send_back[2][QUDA_MAX_DIM]
void copyExtendedGauge(GaugeField &out, const GaugeField &in, QudaFieldLocation location, void *Out=0, void *In=0)
unsigned long long bytes
Definition: blas_quda.cu:43
int comm_dim_partitioned(int dim)