QUDA  0.9.0
transfer.cpp
Go to the documentation of this file.
1 #include <transfer.h>
2 #include <blas_quda.h>
3 
4 #include <transfer.h>
5 #include <multigrid.h>
6 #include <malloc_quda.h>
7 
8 #include <iostream>
9 #include <algorithm>
10 #include <vector>
11 
12 #include <nvToolsExt.h>
13 
14 namespace quda {
15 
16  /*
17  * for the staggered case, there is no spin blocking,
18  * however we do even-odd to preserve chirality (that is straightforward)
19  */
20 
// Construct the multigrid transfer operator (prolongator/restrictor) from the
// Nvec null-space vectors in B, blocking the fine lattice geometrically by
// geo_bs[d] in each dimension and the spin degrees of freedom by spin_bs.
// NOTE(review): this is a Doxygen-extracted listing; gaps in the embedded
// line numbering (e.g. 79/81, 92-97, 101/104/107, 119, 124, 129) show that
// several original source lines are missing from this view -- presumably the
// ColorSpinorField::Create calls assigning V_h/V_d and the fine/coarse
// temporaries, plus the createGeoMap/createSpinMap/BlockOrthogonalize calls.
// Confirm against the upstream transfer.cpp before editing.
21  Transfer::Transfer(const std::vector<ColorSpinorField*> &B, int Nvec, int *geo_bs, int spin_bs, bool enable_gpu, TimeProfile &profile)
22  : B(B), Nvec(Nvec), V_h(0), V_d(0), fine_tmp_h(0), fine_tmp_d(0), coarse_tmp_h(0), coarse_tmp_d(0), geo_bs(0),
23  fine_to_coarse_h(0), coarse_to_fine_h(0),
24  fine_to_coarse_d(0), coarse_to_fine_d(0),
25  spin_bs(spin_bs), spin_map(0), site_subset(QUDA_FULL_SITE_SUBSET), parity(QUDA_INVALID_PARITY),
26  enable_gpu(enable_gpu), use_gpu(enable_gpu), // by default we apply the transfer operator according to enable_gpu flag but can be overridden
27  flops_(0), profile(profile)
28  {
29  int ndim = B[0]->Ndim();
30 
// Validate the requested geometric block in each dimension, halving it until
// it (a) does not swallow the whole X dimension, (b) yields an even coarse
// dimension, and (c) divides the fine dimension exactly; error out if no
// valid size remains.
31  for (int d = 0; d < ndim; d++) {
32  while (geo_bs[d] > 0) {
33  if (d==0 && B[0]->X(0) == geo_bs[0])
34  warningQuda("X-dimension length %d cannot block length %d", B[0]->X(0), geo_bs[0]);
35  else if ( (B[0]->X(d)/geo_bs[d]+1)%2 == 0)
36  warningQuda("Indexing does not (yet) support odd coarse dimensions: X(%d) = %d", d, B[0]->X(d)/geo_bs[d]);
37  else if ( (B[0]->X(d)/geo_bs[d]) * geo_bs[d] != B[0]->X(d) )
38  warningQuda("cannot block dim[%d]=%d with block size = %d", d, B[0]->X(d), geo_bs[d]);
39  else
40  break; // this is a valid block size so let's use it
41  geo_bs[d] /= 2;
42  }
43  if (geo_bs[d] == 0) errorQuda("Unable to block dimension %d", d);
44  }
45 
// Keep a private copy of the (possibly adjusted) block sizes; the caller's
// geo_bs array was modified in place above.
46  this->geo_bs = new int[ndim];
47  int total_block_size = 1;
48  for (int d = 0; d < ndim; d++) {
49  this->geo_bs[d] = geo_bs[d];
50  total_block_size *= geo_bs[d];
51  }
52 
53  if (total_block_size == 1) errorQuda("Total geometric block size is 1");
54 
55  char block_str[128];
56  sprintf(block_str, "%d", geo_bs[0]);
// NOTE(review): passing block_str as both the destination and a %s source of
// sprintf is undefined behavior (overlapping objects, C standard 7.21.6.6);
// should append via an offset (e.g. strlen) or build into a second buffer.
57  for (int d=1; d<ndim; d++) sprintf(block_str, "%s x %d", block_str, geo_bs[d]);
58  printfQuda("Transfer: using block size %s\n", block_str);
59 
60  // create the storage for the final block orthogonal elements
61  ColorSpinorParam param(*B[0]); // takes the geometry from the null-space vectors
62 
63  // the ordering of the V vector is defined by these parameters and
64  // the Packed functions in ColorSpinorFieldOrder
65 
66  param.nSpin = B[0]->Nspin(); // spin has direct mapping
67  param.nColor = B[0]->Ncolor()*Nvec; // nColor = number of colors * number of vectors
69  // the V field is defined on all sites regardless of B field (maybe the B fields are always full?)
70  if (param.siteSubset == QUDA_PARITY_SITE_SUBSET) {
71  //keep it the same for staggered:
72  param.siteSubset = QUDA_FULL_SITE_SUBSET;
73  param.x[0] *= 2;
74  }
75 
76  if (getVerbosity() >= QUDA_VERBOSE) printfQuda("Transfer: creating V field with location %d\n", param.location);
77 
78  // for cpu transfer this is the V field, for gpu it's just a temporary until we port the block orthogonalization
// NOTE(review): original line 81 is missing here -- presumably the
// ColorSpinorField::Create(param) call assigning V_h.
80 
82  param.fieldOrder = QUDA_FLOAT2_FIELD_ORDER;//ok for staggered
83 
// NOTE(review): original line 84 is missing -- presumably the creation of V_d
// when enable_gpu is set.
85 
86  printfQuda("Transfer: filling V field with zero\n");
87  fillV(*V_h); // copy the null space vectors into V
88 
89  param = ColorSpinorParam(*B[0]);
90 
91  // used for cpu<->gpu transfers
// NOTE(review): original lines 92-96 are missing -- presumably creation of
// fine_tmp_h and (via CreateCoarse) coarse_tmp_h.
94 
95  // useful to have around
97 
98  // create temporaries we use to enable us to change basis and for cpu<->gpu transfers
99  if (enable_gpu) {
100  param = ColorSpinorParam(*B[0]);
102  param.fieldOrder = QUDA_FLOAT2_FIELD_ORDER;
103  param.create = QUDA_NULL_FIELD_CREATE;
// NOTE(review): original lines 104-107 are missing -- presumably creation of
// fine_tmp_d and coarse_tmp_d.
105 
106  // used for basis changing
108  }
109 
110  // allocate and compute the fine-to-coarse and coarse-to-fine site maps
111  fine_to_coarse_h = static_cast<int*>(safe_malloc(B[0]->Volume()*sizeof(int)));
112  coarse_to_fine_h = static_cast<int*>(safe_malloc(B[0]->Volume()*sizeof(int)));
113 
114  if (enable_gpu) {
115  fine_to_coarse_d = static_cast<int*>(device_malloc(B[0]->Volume()*sizeof(int)));
116  coarse_to_fine_d = static_cast<int*>(device_malloc(B[0]->Volume()*sizeof(int)));
117  }
118 
// NOTE(review): original line 119 is missing -- presumably the
// createGeoMap(geo_bs) call that fills the maps allocated above.
120 
121  // allocate the fine-to-coarse spin map (don't need it for staggered.)
122  if (param.nSpin != 1){
123  spin_map = static_cast<int*>(safe_malloc(B[0]->Nspin()*sizeof(int)));
// NOTE(review): original line 124 is missing -- presumably createSpinMap(spin_bs).
125  }
126 
127  // orthogonalize the blocks
128  printfQuda("Transfer: block orthogonalizing\n");
// NOTE(review): original line 129 is missing -- presumably the
// BlockOrthogonalize(...) call.
130 
// If running on the GPU, mirror the (host-built) prolongator into device memory.
131  if (enable_gpu) {
132  *V_d = *V_h;
133  printfQuda("Transferred prolongator to GPU\n");
134  }
135  }
136 
// Destructor body: release the null-space field copies, temporaries, and the
// geometric block-size array.  NOTE(review): the "Transfer::~Transfer()"
// signature (definition starts at original line 137 per the index below) and
// original lines 137-142 are missing from this extracted listing -- they
// presumably freed fine_to_coarse_h/coarse_to_fine_h (host_free), the
// device maps (device_free), and spin_map; confirm against upstream.
143  if (V_h) delete V_h;
144  if (V_d) delete V_d;
145 
146  if (fine_tmp_h) delete fine_tmp_h;
147  if (fine_tmp_d) delete fine_tmp_d;
148 
149  if (coarse_tmp_h) delete coarse_tmp_h;
150  if (coarse_tmp_d) delete coarse_tmp_d;
151 
// geo_bs was allocated with new[] in the constructor, hence delete[].
152  if (geo_bs) delete []geo_bs;
153  }
154 
// Set whether the transfer operator acts on full fields or single-parity
// fields and, if single parity, which parity.  Only does real work when the
// operator lives on the GPU: there it swaps the device copy of V between a
// full-field and a single-parity-field allocation to save device memory.
// NOTE(review): extracted listing is missing original lines 165, 170-171,
// 176, 184-186 and 188 -- presumably the opening
// "if (site_subset == QUDA_PARITY_SITE_SUBSET) {" branch, the
// ColorSpinorParam setup from *V_h, and the ColorSpinorField::Create calls
// reassigning V_d; confirm against upstream transfer.cpp.
155  void Transfer::setSiteSubset(QudaSiteSubset site_subset_, QudaParity parity_) {
156  if (parity_ != QUDA_EVEN_PARITY && parity_ != QUDA_ODD_PARITY) errorQuda("Undefined parity %d", parity_);
157  parity = parity_;
158 
// Nothing to do if the subset is unchanged (parity above is always updated).
159  if (site_subset == site_subset_) return;
160  site_subset = site_subset_;
161 
162  // this function only does something non-trivial if the operator is on the GPU
163  if (!enable_gpu) return;
164 
166  // if doing single-parity then delete full field V and replace with single parity
167 
168  delete V_d;
169 
// Halve x[0] and mark the param as a parity subset so the recreated V_d
// holds only one parity of the prolongator.
172  param.fieldOrder = QUDA_FLOAT2_FIELD_ORDER;
173  param.x[0] /= 2;
174  param.siteSubset = QUDA_PARITY_SITE_SUBSET;
175 
// Copy the requested parity of the host prolongator to the device.
177  *V_d = parity == QUDA_EVEN_PARITY ? V_h->Even() : V_h->Odd();
178 
179  } else if (site_subset == QUDA_FULL_SITE_SUBSET) {
180  // if doing full field then delete single parity V and replace with single parity
181 
182  delete V_d;
183 
186  param.fieldOrder = QUDA_FLOAT2_FIELD_ORDER;
187 
// Restore the full-field device copy from the host prolongator.
189  *V_d = *V_h;
190 
191  } else {
192  errorQuda("Undefined site_subset %d", site_subset_);
193  }
194 
195  }
196 
// Copy the null-space vectors B into the packed prolongator field V by
// delegating to the free function FillV.  NOTE(review): the signature line
// "void Transfer::fillV(ColorSpinorField &V) {" (original line 197, per the
// index below) is missing from this extracted listing.
198  FillV(V, B, Nvec); //printfQuda("V fill check %e\n", norm2(*V));
199  }
200 
// Small helper pair used when building the coarse_to_fine map: sorting a
// vector of Int2(coarse_index, fine_index) with std::sort groups fine sites
// by their coarse block (ties broken by fine index).
struct Int2 {
  int x, y;
  Int2() : x(0), y(0) { }
  Int2(int x, int y) : x(x), y(y) { }

  // Strict weak lexicographic ordering: compare x first, break ties on y.
  // (Replaces the original chained-ternary "(c) ? true : (c2) ? true : false"
  // with the equivalent, idiomatic boolean expression.)
  bool operator<(const Int2 &a) const {
    return x < a.x || (x == a.x && y < a.y);
  }
};
210 
211  // compute the fine-to-coarse site map
// Build the fine->coarse site lookup table (fine_to_coarse_h) and its
// sorted inverse-like companion (coarse_to_fine_h), copying both to the
// device when enable_gpu is set.  NOTE(review): original line 216 is missing
// from this extracted listing -- presumably
// "ColorSpinorField &fine(*fine_tmp_h);", which the loop below requires;
// confirm against upstream transfer.cpp.
212  void Transfer::createGeoMap(int *geo_bs) {
213 
// Scratch lattice coordinate, sized for the maximum dimensionality QUDA supports.
214  int x[QUDA_MAX_DIM];
215 
217  ColorSpinorField &coarse(*coarse_tmp_h);
218 
219  // compute the coarse grid point for every site (assuming parity ordering currently)
220  for (int i=0; i<fine.Volume(); i++) {
221  // compute the lattice-site index for this offset index
222  fine.LatticeIndex(x, i);
223 
224  //printfQuda("fine idx %d = fine (%d,%d,%d,%d), ", i, x[0], x[1], x[2], x[3]);
225 
226  // compute the corresponding coarse-grid index given the block size
227  for (int d=0; d<fine.Ndim(); d++) x[d] /= geo_bs[d];
228 
229  // compute the coarse-offset index and store in fine_to_coarse
230  int k;
231  coarse.OffsetIndex(k, x); // this index is parity ordered
232  fine_to_coarse_h[i] = k;
233 
234  //printfQuda("coarse after (%d,%d,%d,%d), coarse idx %d\n", x[0], x[1], x[2], x[3], k);
235  }
236 
237  // now create an inverse-like variant of this
238 
// Sort (coarse index, fine index) pairs so that coarse_to_fine_h lists fine
// sites grouped by coarse block, in ascending fine-index order within a block.
239  std::vector<Int2> geo_sort(B[0]->Volume());
240  for (unsigned int i=0; i<geo_sort.size(); i++) geo_sort[i] = Int2(fine_to_coarse_h[i], i);
241  std::sort(geo_sort.begin(), geo_sort.end());
242  for (unsigned int i=0; i<geo_sort.size(); i++) coarse_to_fine_h[i] = geo_sort[i].y;
243 
// Mirror both lookup tables to device memory for GPU transfer application.
244  if (enable_gpu) {
245  qudaMemcpy(fine_to_coarse_d, fine_to_coarse_h, B[0]->Volume()*sizeof(int), cudaMemcpyHostToDevice);
246  qudaMemcpy(coarse_to_fine_d, coarse_to_fine_h, B[0]->Volume()*sizeof(int), cudaMemcpyHostToDevice);
247  checkCudaError();
248  }
249 
250  }
251 
252  // compute the fine spin to coarse spin map
253  void Transfer::createSpinMap(int spin_bs) {
254 
255  for (int s=0; s<B[0]->Nspin(); s++) {
256  spin_map[s] = s / spin_bs;
257  }
258 
259  }
260 
// apply the prolongator
// Prolongate the coarse field `in` onto the fine field `out` using the
// packed null-space field V.  Handles CPU<->GPU location mismatches and
// gamma-basis mismatches by staging through the pre-allocated temporaries.
// NOTE(review): the signature line
// "void Transfer::P(ColorSpinorField &out, const ColorSpinorField &in) const"
// (original line 262, per the index below) and the closing
// profile.TPSTOP(QUDA_PROFILE_COMPUTE) (original line 296) are missing from
// this extracted listing.
263  profile.TPSTART(QUDA_PROFILE_COMPUTE);
264 
// Default to operating in place; reseat input/output onto temporaries below
// when location or basis requires staging.
265  ColorSpinorField *input = const_cast<ColorSpinorField*>(&in);
266  ColorSpinorField *output = &out;
267  const ColorSpinorField *V = use_gpu ? V_d : V_h;
268  const int *fine_to_coarse = use_gpu ? fine_to_coarse_d : fine_to_coarse_h;
269 
270  if (use_gpu) {
// Coarse input staged through the device coarse temporary if it lives on the CPU.
271  if (in.Location() == QUDA_CPU_FIELD_LOCATION) input = coarse_tmp_d;
272  if (out.Location() == QUDA_CPU_FIELD_LOCATION || out.GammaBasis() != V->GammaBasis())
273  output = (out.SiteSubset() == QUDA_FULL_SITE_SUBSET) ? fine_tmp_d : &fine_tmp_d->Even();
274  if (!enable_gpu) errorQuda("not created with enable_gpu set, so cannot run on GPU");
275  } else {
276  if (out.Location() == QUDA_CUDA_FIELD_LOCATION)
277  output = (out.SiteSubset() == QUDA_FULL_SITE_SUBSET) ? fine_tmp_h : &fine_tmp_h->Even();
278  }
279 
280  *input = in; // copy result to input field (aliasing handled automatically)
281 
282  if (V->SiteSubset() == QUDA_PARITY_SITE_SUBSET && out.SiteSubset() == QUDA_FULL_SITE_SUBSET)
283  errorQuda("Cannot prolongate to a full field since only have single parity null-space components");
284 
// Basis check is skipped for staggered (Nspin == 1) where there is no gamma basis.
285  if ((V->Nspin() != 1) && ((output->GammaBasis() != V->GammaBasis()) || (input->GammaBasis() != V->GammaBasis()))){
286  errorQuda("Cannot apply prolongator using fields in a different basis from the null space (%d,%d) != %d",
287  output->GammaBasis(), in.GammaBasis(), V->GammaBasis());
288  }
289 
290  Prolongate(*output, *input, *V, Nvec, fine_to_coarse, spin_map, parity);
291 
292  out = *output; // copy result to out field (aliasing handled automatically)
293 
// Account 8 flops per (coarse color, fine color) pair per site (complex mul-add).
294  flops_ += 8*in.Ncolor()*out.Ncolor()*out.VolumeCB()*out.SiteSubset();
296 
297  }
298 
// apply the restrictor
// Restrict the fine field `in` down to the coarse field `out` using the
// packed null-space field V; the mirror operation of P above, with the same
// location/basis staging through the temporaries.  NOTE(review): the
// signature line
// "void Transfer::R(ColorSpinorField &out, const ColorSpinorField &in) const"
// (original line 300, per the index below), the conditional
// qudaDeviceSynchronize (original line 335), and the closing
// profile.TPSTOP(QUDA_PROFILE_COMPUTE) (original line 339) are missing from
// this extracted listing.
302  profile.TPSTART(QUDA_PROFILE_COMPUTE);
303 
304  ColorSpinorField *input = &const_cast<ColorSpinorField&>(in);
305  ColorSpinorField *output = &out;
306  const ColorSpinorField *V = use_gpu ? V_d : V_h;
307  const int *fine_to_coarse = use_gpu ? fine_to_coarse_d : fine_to_coarse_h;
308  const int *coarse_to_fine = use_gpu ? coarse_to_fine_d : coarse_to_fine_h;
309 
310  if (use_gpu) {
// Coarse output staged through the device coarse temporary if it lives on the CPU.
311  if (out.Location() == QUDA_CPU_FIELD_LOCATION) output = coarse_tmp_d;
312  if (in.Location() == QUDA_CPU_FIELD_LOCATION || in.GammaBasis() != V->GammaBasis())
313  input = (in.SiteSubset() == QUDA_FULL_SITE_SUBSET) ? fine_tmp_d : &fine_tmp_d->Even();
314  if (!enable_gpu) errorQuda("not created with enable_gpu set, so cannot run on GPU");
315  } else {
316  if (in.Location() == QUDA_CUDA_FIELD_LOCATION)
317  input = (in.SiteSubset() == QUDA_FULL_SITE_SUBSET) ? fine_tmp_h : &fine_tmp_h->Even();
318  }
319 
320  *input = in;
321 
322  if (V->SiteSubset() == QUDA_PARITY_SITE_SUBSET && in.SiteSubset() == QUDA_FULL_SITE_SUBSET)
323  errorQuda("Cannot restrict a full field since only have single parity null-space components");
324 
// Basis check is skipped for staggered (Nspin == 1) where there is no gamma basis.
325  if ( V->Nspin() != 1 && ( output->GammaBasis() != V->GammaBasis() || input->GammaBasis() != V->GammaBasis() ) )
326  errorQuda("Cannot apply restrictor using fields in a different basis from the null space (%d,%d) != %d",
327  out.GammaBasis(), input->GammaBasis(), V->GammaBasis());
328 
329  Restrict(*output, *input, *V, Nvec, fine_to_coarse, coarse_to_fine, spin_map, parity);
330 
331  out = *output; // copy result to out field (aliasing handled automatically)
332 
333  // only need to synchronize if we're transferring from GPU to CPU
334  if (out.Location() == QUDA_CPU_FIELD_LOCATION && in.Location() == QUDA_CUDA_FIELD_LOCATION)
336 
// Account 8 flops per (coarse color, fine color) pair per site (complex mul-add).
337  flops_ += 8*out.Ncolor()*in.Ncolor()*in.VolumeCB()*in.SiteSubset();
338 
340  }
341 
342  double Transfer::flops() const {
343  double rtn = flops_;
344  flops_ = 0;
345  return rtn;
346  }
347 
348 } // namespace quda
#define qudaMemcpy(dst, src, count, kind)
Definition: quda_cuda_api.h:32
bool enable_gpu
Definition: transfer.h:96
void OffsetIndex(int &i, int *y) const
TimeProfile & profile
Definition: transfer.h:156
const int Nvec
Definition: transfer.h:38
QudaVerbosity getVerbosity()
Definition: util_quda.cpp:20
#define errorQuda(...)
Definition: util_quda.h:90
void R(ColorSpinorField &out, const ColorSpinorField &in) const
Definition: transfer.cpp:300
#define host_free(ptr)
Definition: malloc_quda.h:59
const ColorSpinorField & Even() const
const ColorSpinorField & Odd() const
static ColorSpinorField * Create(const ColorSpinorParam &param)
QudaGammaBasis GammaBasis() const
int * fine_to_coarse_d
Definition: transfer.h:76
void P(ColorSpinorField &out, const ColorSpinorField &in) const
Definition: transfer.cpp:262
ColorSpinorField * fine_tmp_h
Definition: transfer.h:47
double flops_
Definition: transfer.h:150
void setSiteSubset(QudaSiteSubset site_subset, QudaParity parity)
Sets whether the transfer operator is to act on full fields or single parity fields, and if single-parity which parity. If site_subset is QUDA_FULL_SITE_SUBSET, the transfer operator can still be applied to single-parity fields, however, if site_subset is QUDA_PARITY_SITE_SUBSET, then the transfer operator cannot be applied to full fields, and setSiteSubset will need to be called first to reset to QUDA_FULL_SITE_SUBSET. This method exists to reduce GPU memory overhead - if only transfering single-parity fine fields then we only store a single-parity copy of the null space components on the device.
Definition: transfer.cpp:155
QudaParity parity
Definition: transfer.h:93
int Nspin
Definition: blas_test.cu:45
ColorSpinorField * coarse_tmp_d
Definition: transfer.h:56
void FillV(ColorSpinorField &V, const std::vector< ColorSpinorField *> &B, int Nvec)
QudaGaugeParam param
Definition: pack_test.cpp:17
static int ndim
Definition: layout_hyper.c:53
int * coarse_to_fine_h
Definition: transfer.h:70
QudaSiteSubset site_subset
Definition: transfer.h:90
void createGeoMap(int *geo_bs)
Definition: transfer.cpp:212
cpuColorSpinorField * in
ColorSpinorField * coarse_tmp_h
Definition: transfer.h:53
int V
Definition: test_util.cpp:28
#define warningQuda(...)
Definition: util_quda.h:101
void Restrict(ColorSpinorField &out, const ColorSpinorField &in, const ColorSpinorField &v, int Nvec, const int *fine_to_coarse, const int *coarse_to_fine, const int *spin_map, int parity=QUDA_INVALID_PARITY)
Apply the restriction operator.
Definition: restrictor.cu:509
int * spin_map
Definition: transfer.h:87
ColorSpinorField * V_h
Definition: transfer.h:41
enum QudaParity_s QudaParity
cudaError_t qudaDeviceSynchronize()
Wrapper around cudaDeviceSynchronize or cuDeviceSynchronize.
#define safe_malloc(size)
Definition: malloc_quda.h:54
enum QudaSiteSubset_s QudaSiteSubset
int * fine_to_coarse_h
Definition: transfer.h:65
ColorSpinorField * CreateCoarse(const int *geoblockSize, int spinBlockSize, int Nvec, QudaFieldLocation location=QUDA_INVALID_FIELD_LOCATION)
QudaFieldLocation location
Definition: quda.h:27
cpuColorSpinorField * out
int sprintf(char *, const char *,...) __attribute__((__format__(__printf__
#define printfQuda(...)
Definition: util_quda.h:84
void fillV(ColorSpinorField &V)
Definition: transfer.cpp:197
Transfer(const std::vector< ColorSpinorField *> &B, int Nvec, int *geo_bs, int spin_bs, bool enable_gpu, TimeProfile &profile)
Definition: transfer.cpp:21
#define device_malloc(size)
Definition: malloc_quda.h:52
void LatticeIndex(int *y, int i) const
ColorSpinorField * V_d
Definition: transfer.h:44
bool operator<(const Int2 &a) const
Definition: transfer.cpp:206
#define QUDA_MAX_DIM
Maximum number of dimensions supported by QUDA. In practice, no routines make use of more than 5...
#define checkCudaError()
Definition: util_quda.h:129
ColorSpinorField * fine_tmp_d
Definition: transfer.h:50
void createSpinMap(int spin_bs)
Definition: transfer.cpp:253
void BlockOrthogonalize(ColorSpinorField &V, int Nvec, const int *geo_bs, const int *fine_to_coarse, int spin_bs)
Block orthogonnalize the matrix field, where the blocks are defined by lookup tables that map the fin...
Int2(int x, int y)
Definition: transfer.cpp:204
const std::vector< ColorSpinorField * > & B
Definition: transfer.h:35
static __inline__ size_t size_t d
QudaParity parity
Definition: covdev_test.cpp:53
double flops() const
Definition: transfer.cpp:342
#define a
int * coarse_to_fine_d
Definition: transfer.h:81
int * geo_bs
Definition: transfer.h:59
virtual ~Transfer()
Definition: transfer.cpp:137
void Prolongate(ColorSpinorField &out, const ColorSpinorField &in, const ColorSpinorField &v, int Nvec, const int *fine_to_coarse, const int *spin_map, int parity=QUDA_INVALID_PARITY)
Apply the prolongation operator.
Definition: prolongator.cu:284
#define device_free(ptr)
Definition: malloc_quda.h:57