|
QUDA v0.3.2
A library for QCD on GPUs
|
#include <stdio.h>
#include <stdlib.h>
#include <quda_internal.h>
#include <color_spinor_field.h>
#include <blas_quda.h>
#include <test_util.h>
#include "../lib/blas_param.h"

Go to the source code of this file.
Functions | |
| void | setPrec (ColorSpinorParam &param, const QudaPrecision precision) |
| bool | isReduction (int kernel) |
| void | initFields (int prec) |
| void | freeFields () |
| double | benchmark (int kernel, int niter) |
| void | write (char *names[], int threads[][3], int blocks[][3]) |
| int | main (int argc, char **argv) |
Variables | |
| const int | LX = 24 |
| const int | LY = 24 |
| const int | LZ = 24 |
| const int | LT = 24 |
| const int | Nspin = 4 |
| const int | Niter = 10 * (24*24*24*24*4) / (LX * LY * LZ * LT * Nspin) |
| const int | Nkernels = 24 |
| const int | ThreadMin = 32 |
| const int | ThreadMax = 1024 |
| const int | GridMin = 1 |
| const int | GridMax = 65536 |
| cudaColorSpinorField * | x |
| cudaColorSpinorField * | y |
| cudaColorSpinorField * | z |
| cudaColorSpinorField * | w |
| cudaColorSpinorField * | v |
| cudaColorSpinorField * | h |
| cudaColorSpinorField * | l |
| double benchmark | ( | int | kernel, |
| int | niter | ||
| ) |
Definition at line 126 of file blas_test.cu.
| void freeFields | ( | ) |
Definition at line 113 of file blas_test.cu.
| void initFields | ( | int | prec | ) |
Definition at line 50 of file blas_test.cu.
| bool isReduction | ( | int | kernel | ) |
Definition at line 44 of file blas_test.cu.
| int main | ( | int | argc, |
| char ** | argv | ||
| ) |
Definition at line 284 of file blas_test.cu.
| void setPrec | ( | ColorSpinorParam & | param, |
| const QudaPrecision | precision | ||
| ) |
Definition at line 32 of file blas_test.cu.
| void write | ( | char * | names[], |
| int | threads[][3], | ||
| int | blocks[][3] | ||
| ) |
Definition at line 257 of file blas_test.cu.
| const int GridMax = 65536 |
Definition at line 24 of file blas_test.cu.
| const int GridMin = 1 |
Definition at line 23 of file blas_test.cu.
| cudaColorSpinorField * h |
Definition at line 26 of file blas_test.cu.
| cudaColorSpinorField * l |
Definition at line 26 of file blas_test.cu.
| const int LT = 24 |
Definition at line 14 of file blas_test.cu.
| const int LX = 24 |
Definition at line 11 of file blas_test.cu.
| const int LY = 24 |
Definition at line 12 of file blas_test.cu.
| const int LZ = 24 |
Definition at line 13 of file blas_test.cu.
| const int Niter = 10 * (24*24*24*24*4) / (LX * LY * LZ * LT * Nspin) |
Definition at line 18 of file blas_test.cu.
| const int Nkernels = 24 |
Definition at line 20 of file blas_test.cu.
| const int Nspin = 4 |
Definition at line 15 of file blas_test.cu.
| const int ThreadMax = 1024 |
Definition at line 22 of file blas_test.cu.
| const int ThreadMin = 32 |
Definition at line 21 of file blas_test.cu.
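| cudaColorSpinorField * v |
Definition at line 26 of file blas_test.cu.
| cudaColorSpinorField * w |
Definition at line 26 of file blas_test.cu.
| cudaColorSpinorField * x |
Definition at line 26 of file blas_test.cu.
| cudaColorSpinorField * y |
Definition at line 26 of file blas_test.cu.
| cudaColorSpinorField * z |
Definition at line 26 of file blas_test.cu.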
1.7.3