|
file | blas_cublas.cu [code] |
|
file | blas_magma.cu [code] |
|
file | blas_magma_nopiv.cu [code] |
|
file | blas_quda.cu [code] |
|
file | block_orthogonalize.cu [code] |
|
file | check_params.h [code] |
|
file | checksum.cu [code] |
|
file | clover_deriv_quda.cu [code] |
| This kernel has been a bit of a pain to optimize since it is excessively register-bound. To reduce register pressure, we offload some of it to shared memory. Annoyingly, the optimal approach for CUDA 8.0 is not the same as for CUDA 7.5, so the implementation is compiler-version dependent. The CUDA 8.0 optimal code runs 10x slower on 7.5, though the 7.5 code runs fine on 8.0.
|
|
file | clover_field.cpp [code] |
|
file | clover_invert.cu [code] |
|
file | clover_outer_product.cu [code] |
|
file | clover_quda.cu [code] |
|
file | clover_sigma_outer_product.cu [code] |
|
file | clover_trace_quda.cu [code] |
|
file | coarse_op.cu [code] |
|
file | coarse_op.cuh [code] |
|
file | coarse_op_preconditioned.cu [code] |
|
file | coarsecoarse_op.cu [code] |
|
file | color_spinor_field.cpp [code] |
|
file | color_spinor_pack.cu [code] |
| This is the implementation of the color-spinor halo packer for an arbitrary field. This implementation uses the fine-grained accessors and should support all field types regardless of precision, number of colors or spins, etc.
|
|
file | color_spinor_util.cu [code] |
|
file | color_spinor_wuppertal.cu [code] |
|
file | comm_common.cpp [code] |
|
file | comm_mpi.cpp [code] |
|
file | comm_qmp.cpp [code] |
|
file | comm_single.cpp [code] |
|
file | contract.cu [code] |
|
file | copy_clover.cu [code] |
|
file | copy_color_spinor.cu [code] |
|
file | copy_color_spinor.cuh [code] |
|
file | copy_color_spinor_dd.cu [code] |
|
file | copy_color_spinor_dh.cu [code] |
|
file | copy_color_spinor_dq.cu [code] |
|
file | copy_color_spinor_ds.cu [code] |
|
file | copy_color_spinor_hd.cu [code] |
|
file | copy_color_spinor_hh.cu [code] |
|
file | copy_color_spinor_hq.cu [code] |
|
file | copy_color_spinor_hs.cu [code] |
|
file | copy_color_spinor_mg.cuh [code] |
|
file | copy_color_spinor_mg_dd.cu [code] |
|
file | copy_color_spinor_mg_ds.cu [code] |
|
file | copy_color_spinor_mg_hh.cu [code] |
|
file | copy_color_spinor_mg_hq.cu [code] |
|
file | copy_color_spinor_mg_hs.cu [code] |
|
file | copy_color_spinor_mg_qh.cu [code] |
|
file | copy_color_spinor_mg_qq.cu [code] |
|
file | copy_color_spinor_mg_qs.cu [code] |
|
file | copy_color_spinor_mg_sd.cu [code] |
|
file | copy_color_spinor_mg_sh.cu [code] |
|
file | copy_color_spinor_mg_sq.cu [code] |
|
file | copy_color_spinor_mg_ss.cu [code] |
|
file | copy_color_spinor_qd.cu [code] |
|
file | copy_color_spinor_qh.cu [code] |
|
file | copy_color_spinor_qq.cu [code] |
|
file | copy_color_spinor_qs.cu [code] |
|
file | copy_color_spinor_sd.cu [code] |
|
file | copy_color_spinor_sh.cu [code] |
|
file | copy_color_spinor_sq.cu [code] |
|
file | copy_color_spinor_ss.cu [code] |
|
file | copy_gauge.cu [code] |
|
file | copy_gauge_double.cu [code] |
|
file | copy_gauge_extended.cu [code] |
|
file | copy_gauge_half.cu [code] |
|
file | copy_gauge_helper.cuh [code] |
|
file | copy_gauge_inc.cu [code] |
|
file | copy_gauge_mg.cu [code] |
|
file | copy_gauge_quarter.cu [code] |
|
file | copy_gauge_single.cu [code] |
|
file | copy_quda.cu [code] |
|
file | covDev.cu [code] |
|
file | cpu_color_spinor_field.cpp [code] |
|
file | cpu_gauge_field.cpp [code] |
|
file | cuda_color_spinor_field.cpp [code] |
|
file | cuda_gauge_field.cpp [code] |
|
file | CUFFT_Plans.h [code] |
|
file | deflation.cpp [code] |
|
file | dirac.cpp [code] |
|
file | dirac_clover.cpp [code] |
|
file | dirac_coarse.cpp [code] |
|
file | dirac_domain_wall.cpp [code] |
|
file | dirac_domain_wall_4d.cpp [code] |
|
file | dirac_improved_staggered.cpp [code] |
|
file | dirac_mobius.cpp [code] |
|
file | dirac_staggered.cpp [code] |
|
file | dirac_twisted_clover.cpp [code] |
|
file | dirac_twisted_mass.cpp [code] |
|
file | dirac_wilson.cpp [code] |
|
file | dslash5_domain_wall.cu [code] |
|
file | dslash_coarse.cu [code] |
|
file | dslash_constants.h [code] |
|
file | dslash_domain_wall_4d.cu [code] |
|
file | dslash_domain_wall_5d.cu [code] |
|
file | dslash_improved_staggered.cu [code] |
|
file | dslash_index.cuh [code] |
|
file | dslash_ndeg_twisted_mass.cu [code] |
|
file | dslash_ndeg_twisted_mass_preconditioned.cu [code] |
|
file | dslash_pack2.cu [code] |
|
file | dslash_policy.cuh [code] |
|
file | dslash_quda.cu [code] |
|
file | dslash_quda.cuh [code] |
|
file | dslash_staggered.cu [code] |
|
file | dslash_twisted_clover.cu [code] |
|
file | dslash_twisted_clover_preconditioned.cu [code] |
|
file | dslash_twisted_mass.cu [code] |
|
file | dslash_twisted_mass_preconditioned.cu [code] |
|
file | dslash_wilson.cu [code] |
|
file | dslash_wilson_clover.cu [code] |
|
file | dslash_wilson_clover_preconditioned.cu [code] |
|
file | eigensolve_quda.cpp [code] |
|
file | extended_color_spinor_utilities.cu [code] |
|
|
|
|
|
file | gauge_ape.cu [code] |
|
file | gauge_covdev.cpp [code] |
|
file | gauge_field.cpp [code] |
|
file | gauge_field_strength_tensor.cu [code] |
|
file | gauge_fix_fft.cu [code] |
|
file | gauge_fix_ovr.cu [code] |
|
|
|
file | gauge_fix_ovr_hit_devf.cuh [code] |
|
file | gauge_force.cu [code] |
|
file | gauge_laplace.cpp [code] |
|
file | gauge_phase.cu [code] |
|
file | gauge_plaq.cu [code] |
|
file | gauge_qcharge.cu [code] |
|
file | gauge_random.cu [code] |
|
file | gauge_stout.cu [code] |
|
file | gauge_update_quda.cu [code] |
|
file | generic_blas.cuh [code] |
|
file | generic_reduce.cuh [code] |
|
file | hisq_paths_force_quda.cu [code] |
|
file | interface_quda.cpp [code] |
|
file | inv_bicgstab_quda.cpp [code] |
|
file | inv_bicgstabl_quda.cpp [code] |
|
file | inv_ca_cg.cpp [code] |
|
file | inv_ca_gcr.cpp [code] |
|
file | inv_cg3_quda.cpp [code] |
|
file | inv_cg3ne_quda.cpp [code] |
|
file | inv_cg_quda.cpp [code] |
|
file | inv_eigcg_quda.cpp [code] |
|
file | inv_gcr_quda.cpp [code] |
|
file | inv_gmresdr_quda.cpp [code] |
|
file | inv_mpbicgstab_quda.cpp [code] |
|
file | inv_mpcg_quda.cpp [code] |
|
file | inv_mr_quda.cpp [code] |
|
file | inv_mre.cpp [code] |
|
file | inv_msrc_cg_quda.cpp [code] |
|
file | inv_multi_cg_quda.cpp [code] |
|
file | inv_pcg_quda.cpp [code] |
|
file | inv_sbicgstab_quda.cpp [code] |
|
file | inv_sd_quda.cpp [code] |
|
file | inv_xsd_quda.cpp [code] |
|
file | ks_force_quda.cu [code] |
|
file | laplace.cu [code] |
|
file | lattice_field.cpp [code] |
|
file | layout_hyper.c [code] |
|
file | llfat_quda.cu [code] |
|
file | malloc.cpp [code] |
|
file | max_clover.cu [code] |
|
file | max_gauge.cu [code] |
|
file | milc_interface.cpp [code] |
|
file | momentum.cu [code] |
|
file | multi_blas_quda.cu [code] |
|
file | multi_reduce_quda.cu [code] |
|
file | multigrid.cpp [code] |
|
file | numa_affinity.cpp [code] |
|
file | nvtx_pmpi.c [code] |
|
file | pgauge_det_trace.cu [code] |
|
file | pgauge_exchange.cu [code] |
|
file | pgauge_heatbath.cu [code] |
|
file | pgauge_init.cu [code] |
|
file | prolongator.cu [code] |
|
file | qio_field.cpp [code] |
|
file | qio_util.cpp [code] |
|
file | quda_arpack_interface.cpp [code] |
|
file | quda_cuda_api.cpp [code] |
|
file | random.cu [code] |
|
file | reduce_quda.cu [code] |
|
file | restrictor.cu [code] |
|
file | shift_quark_field.cu [code] |
|
file | solver.cpp [code] |
|
file | spinor_noise.cu [code] |
|
file | staggered_oprod.cu [code] |
|
file | svd_quda.h [code] |
|
file | timer.cpp [code] |
|
file | transfer.cpp [code] |
|
file | tune.cpp [code] |
|
file | unitarize_force_quda.cu [code] |
|
file | unitarize_links_quda.cu [code] |
|
file | util_quda.cpp [code] |
|
file | version.cpp [code] |
|