quda-ref/v1.0.0/copy__gauge__mg_8cu_source.html

 #include <gauge_field_order.h>

 #define FINE_GRAINED_ACCESS

 #include <copy_gauge_helper.cuh>

 namespace quda {

   template <typename sFloatOut, typename sFloatIn, int Nc, typename InOrder>
   void copyGaugeMG(const InOrder &inOrder, GaugeField &out, const GaugeField &in,
        QudaFieldLocation location, sFloatOut *Out, sFloatOut **outGhost, int type) {

     typedef typename mapper<sFloatOut>::type FloatOut;
     typedef typename mapper<sFloatIn>::type FloatIn;
     constexpr int length = 2*Nc*Nc;

     if (out.Reconstruct() != QUDA_RECONSTRUCT_NO)
       errorQuda("Reconstruct type %d not supported", out.Reconstruct());

 #ifdef FINE_GRAINED_ACCESS
     if (out.Precision() == QUDA_HALF_PRECISION) {
       if (in.Precision() == QUDA_HALF_PRECISION) {
   out.Scale(in.Scale());
       } else {
   InOrder in_(const_cast<GaugeField&>(in));
   out.Scale( in.abs_max() );
       }
     }
 #endif

     if (out.isNative()) {

 #ifdef FINE_GRAINED_ACCESS
       if (outGhost) {
   typedef typename gauge::FieldOrder<FloatOut,Nc,1,QUDA_FLOAT2_GAUGE_ORDER,false,sFloatOut> G;
   copyGauge<FloatOut,FloatIn,length>(G(out,(void*)Out,(void**)outGhost), inOrder, out, in, location, type);
       } else {
   typedef typename gauge::FieldOrder<FloatOut,Nc,1,QUDA_FLOAT2_GAUGE_ORDER,true,sFloatOut> G;
   copyGauge<FloatOut,FloatIn,length>(G(out,(void*)Out,(void**)outGhost), inOrder, out, in, location, type);
       }
 #else
       typedef typename gauge_mapper<FloatOut,QUDA_RECONSTRUCT_NO,length>::type G;
       copyGauge<FloatOut,FloatIn,length>
   (G(out,Out,outGhost), inOrder, out, in, location, type);
 #endif

     } else if (out.Order() == QUDA_QDP_GAUGE_ORDER) {

 #ifdef FINE_GRAINED_ACCESS
       typedef typename gauge::FieldOrder<FloatOut,Nc,1,QUDA_QDP_GAUGE_ORDER,true,sFloatOut> G;
       copyGauge<FloatOut,FloatIn,length>(G(out,(void*)Out,(void**)outGhost), inOrder, out, in, location, type);
 #else
       typedef typename QDPOrder<FloatOut,length> G;
       copyGauge<FloatOut,FloatIn,length>(G(out, Out, outGhost), inOrder, out, in, location, type);
 #endif

     } else if (out.Order() == QUDA_MILC_GAUGE_ORDER) {

 #ifdef FINE_GRAINED_ACCESS
       typedef typename gauge::FieldOrder<FloatOut,Nc,1,QUDA_MILC_GAUGE_ORDER,true,sFloatOut> G;
       copyGauge<FloatOut,FloatIn,length>(G(out,(void*)Out,(void**)outGhost), inOrder, out, in, location, type);
 #else
       typedef typename MILCOrder<FloatOut,length> G;
       copyGauge<FloatOut,FloatIn,length>(G(out, Out, outGhost), inOrder, out, in, location, type);
 #endif

     } else {
       errorQuda("Gauge field %d order not supported", out.Order());
     }

   }

   template <typename sFloatOut, typename sFloatIn, int Nc>
     void copyGaugeMG(GaugeField &out, const GaugeField &in, QudaFieldLocation location,
          sFloatOut *Out, sFloatIn *In, sFloatOut **outGhost, sFloatIn **inGhost, int type) {

     typedef typename mapper<sFloatOut>::type FloatOut;
     typedef typename mapper<sFloatIn>::type FloatIn;
 #ifndef FINE_GRAINED_ACCESS
     constexpr int length = 2*Nc*Nc;
 #endif

     if (in.Reconstruct() != QUDA_RECONSTRUCT_NO)
       errorQuda("Reconstruct type %d not supported", in.Reconstruct());

     if (in.isNative()) {
 #ifdef FINE_GRAINED_ACCESS
       if (inGhost) {
   typedef typename gauge::FieldOrder<FloatIn,Nc,1,QUDA_FLOAT2_GAUGE_ORDER,false,sFloatIn> G;
   copyGaugeMG<sFloatOut,sFloatIn,Nc> (G(const_cast<GaugeField&>(in),(void*)In,(void**)inGhost), out, in, location, Out, outGhost, type);
       } else {
   typedef typename gauge::FieldOrder<FloatIn,Nc,1,QUDA_FLOAT2_GAUGE_ORDER,true,sFloatIn> G;
   copyGaugeMG<sFloatOut,sFloatIn,Nc> (G(const_cast<GaugeField&>(in),(void*)In,(void**)inGhost), out, in, location, Out, outGhost, type);
       }
 #else
       typedef typename gauge_mapper<FloatIn,QUDA_RECONSTRUCT_NO,length>::type G;
       copyGaugeMG<FloatOut,FloatIn,Nc> (G(in, In,inGhost), out, in, location, Out, outGhost, type);
 #endif
     } else if (in.Order() == QUDA_QDP_GAUGE_ORDER) {

 #ifdef FINE_GRAINED_ACCESS
       typedef typename gauge::FieldOrder<FloatIn,Nc,1,QUDA_QDP_GAUGE_ORDER,true,sFloatIn> G;
       copyGaugeMG<sFloatOut,sFloatIn,Nc>(G(const_cast<GaugeField&>(in),(void*)In,(void**)inGhost), out, in, location, Out, outGhost, type);
 #else
       typedef typename QDPOrder<FloatIn,length> G;
       copyGaugeMG<FloatOut,FloatIn,Nc>(G(in, In, inGhost), out, in, location, Out, outGhost, type);
 #endif

     } else if (in.Order() == QUDA_MILC_GAUGE_ORDER) {

 #ifdef FINE_GRAINED_ACCESS
       typedef typename gauge::FieldOrder<FloatIn,Nc,1,QUDA_MILC_GAUGE_ORDER,true,sFloatIn> G;
       copyGaugeMG<sFloatOut,sFloatIn,Nc>(G(const_cast<GaugeField&>(in),(void*)In,(void**)inGhost), out, in, location, Out, outGhost, type);
 #else
       typedef typename MILCOrder<FloatIn,length> G;
       copyGaugeMG<FloatOut,FloatIn,Nc>(G(in, In, inGhost), out, in, location, Out, outGhost, type);
 #endif

     } else {
       errorQuda("Gauge field %d order not supported", in.Order());
     }

   }

   template <typename FloatOut, typename FloatIn>
   void copyGaugeMG(GaugeField &out, const GaugeField &in, QudaFieldLocation location, FloatOut *Out,
        FloatIn *In, FloatOut **outGhost, FloatIn **inGhost, int type) {

     switch(in.Ncolor()) {
 #ifdef GPU_MULTIGRID
     case  8: copyGaugeMG<FloatOut,FloatIn, 8>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 12: copyGaugeMG<FloatOut,FloatIn,12>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 16: copyGaugeMG<FloatOut,FloatIn,16>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 24: copyGaugeMG<FloatOut,FloatIn,24>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 32: copyGaugeMG<FloatOut,FloatIn,32>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 40: copyGaugeMG<FloatOut,FloatIn,40>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 48: copyGaugeMG<FloatOut,FloatIn,48>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 56: copyGaugeMG<FloatOut,FloatIn,56>(out, in, location, Out, In, outGhost, inGhost, type); break;
     case 64: copyGaugeMG<FloatOut,FloatIn,64>(out, in, location, Out, In, outGhost, inGhost, type); break;
 #endif // GPU_MULTIGRID
     default: errorQuda("Unsupported number of colors; out.Nc=%d, in.Nc=%d", out.Ncolor(), in.Ncolor());
     }
   }

   // this is the function that is actually called, from here on down we instantiate all required templates
   void copyGenericGaugeMG(GaugeField &out, const GaugeField &in, QudaFieldLocation location,
         void *Out, void *In, void **ghostOut, void **ghostIn, int type) {

 #ifndef FINE_GRAINED_ACCESS
     if (out.Precision() == QUDA_HALF_PRECISION || in.Precision() == QUDA_HALF_PRECISION)
       errorQuda("Precision format not supported");
 #endif

     if (out.Precision() == QUDA_DOUBLE_PRECISION) {
 #ifdef GPU_MULTIGRID_DOUBLE
       if (in.Precision() == QUDA_DOUBLE_PRECISION) {
   copyGaugeMG(out, in, location, (double*)Out, (double*)In, (double**)ghostOut, (double**)ghostIn, type);
       } else if (in.Precision() == QUDA_SINGLE_PRECISION) {
   copyGaugeMG(out, in, location, (double*)Out, (float*)In, (double**)ghostOut, (float**)ghostIn, type);
       } else if (in.Precision() == QUDA_HALF_PRECISION) {
   copyGaugeMG(out, in, location, (double*)Out, (short*)In, (double**)ghostOut, (short**)ghostIn, type);
       } else {
   errorQuda("Precision %d not supported", in.Precision());
       }
 #else
       errorQuda("Double precision multigrid has not been enabled");
 #endif
     } else if (out.Precision() == QUDA_SINGLE_PRECISION) {
       if (in.Precision() == QUDA_DOUBLE_PRECISION) {
 #ifdef GPU_MULTIGRID_DOUBLE
   copyGaugeMG(out, in, location, (float*)Out, (double*)In, (float**)ghostOut, (double**)ghostIn, type);
 #else
   errorQuda("Double precision multigrid has not been enabled");
 #endif
       } else if (in.Precision() == QUDA_SINGLE_PRECISION) {
   copyGaugeMG(out, in, location, (float*)Out, (float*)In, (float**)ghostOut, (float**)ghostIn, type);
       } else if (in.Precision() == QUDA_HALF_PRECISION) {
   copyGaugeMG(out, in, location, (float*)Out, (short*)In, (float**)ghostOut, (short**)ghostIn, type);
       } else {
   errorQuda("Precision %d not supported", in.Precision());
       }
     } else if (out.Precision() == QUDA_HALF_PRECISION) {
       if (in.Precision() == QUDA_DOUBLE_PRECISION) {
 #ifdef GPU_MULTIGRID_DOUBLE
   copyGaugeMG(out, in, location, (short*)Out, (double*)In, (short**)ghostOut, (double**)ghostIn, type);
 #else
   errorQuda("Double precision multigrid has not been enabled");
 #endif
       } else if (in.Precision() == QUDA_SINGLE_PRECISION) {
   copyGaugeMG(out, in, location, (short*)Out, (float*)In, (short**)ghostOut, (float**)ghostIn, type);
       } else if (in.Precision() == QUDA_HALF_PRECISION) {
   copyGaugeMG(out, in, location, (short*)Out, (short*)In, (short**)ghostOut, (short**)ghostIn, type);
       } else {
   errorQuda("Precision %d not supported", in.Precision());
       }
     } else {
       errorQuda("Precision %d not supported", out.Precision());
     }
   }


 } // namespace quda
QUDA_RECONSTRUCT_NO
Definition: enum_quda.h:67

quda::gauge::MILCOrder
Definition: gauge_field_order.h:2332

errorQuda
#define errorQuda(...)
Definition: util_quda.h:121

QUDA_HALF_PRECISION
Definition: enum_quda.h:60

QUDA_QDP_GAUGE_ORDER
Definition: enum_quda.h:41

quda::LatticeField::Scale
double Scale() const
Definition: lattice_field.h:556

quda::GaugeField::abs_max
double abs_max(int dim=-1) const
Compute the absolute maximum of the field (Linfinity norm)
Definition: max_gauge.cu:84

copy_gauge_helper.cuh

length
int length[]
Definition: gauge_force_test.cpp:34

quda
Definition: blas_cublas.h:5

quda::gauge::FieldOrder
Definition: gauge_field_order.h:896

quda::GaugeField::Ncolor
int Ncolor() const
Definition: gauge_field.h:249

quda::copyGaugeMG
void copyGaugeMG(const InOrder &inOrder, GaugeField &out, const GaugeField &in, QudaFieldLocation location, sFloatOut *Out, sFloatOut **outGhost, int type)
Definition: copy_gauge_mg.cu:10

QUDA_MILC_GAUGE_ORDER
Definition: enum_quda.h:44

in
cpuColorSpinorField * in
Definition: staggered_invert_test.cpp:98

gauge_field_order.h
Main header file for host and device accessors to GaugeFields.

quda::clover::QDPOrder
Definition: clover_field_order.h:800

QUDA_DOUBLE_PRECISION
Definition: enum_quda.h:62

QudaFieldLocation
enum QudaFieldLocation_s QudaFieldLocation

out
cpuColorSpinorField * out
Definition: staggered_invert_test.cpp:99

QUDA_SINGLE_PRECISION
Definition: enum_quda.h:61

quda::mapper
Definition: register_traits.h:43

quda::gauge_mapper
Definition: gauge_field_order.h:3012

quda::copyGenericGaugeMG
void copyGenericGaugeMG(GaugeField &out, const GaugeField &in, QudaFieldLocation location, void *Out, void *In, void **ghostOut, void **ghostIn, int type)
Definition: copy_gauge_mg.cu:146

quda::GaugeField::Reconstruct
QudaReconstructType Reconstruct() const
Definition: gauge_field.h:250

quda::GaugeField::Order
QudaGaugeFieldOrder Order() const
Definition: gauge_field.h:251

quda::LatticeField::Precision
QudaPrecision Precision() const
Definition: lattice_field.h:546

quda::GaugeField::isNative
bool isNative() const
Definition: gauge_field.cpp:167

quda::GaugeField
Definition: gauge_field.h:164