/* File produced by Kranc */ #define KRANC_C #include #include #include #include #include #include "cctk.h" #include "cctk_Arguments.h" #include "cctk_Parameters.h" #include "GenericFD.h" #include "Differencing.h" #include "cctk_Loop.h" #include "loopcontrol.h" #include "OpenCLRunTime.h" #include "vectors.h" /* Define macros used in calculations */ #define INITVALUE (42) #define ScalarINV(x) ((CCTK_REAL)1.0 / (x)) #define ScalarSQR(x) ((x) * (x)) #define ScalarCUB(x) ((x) * ScalarSQR(x)) #define ScalarQAD(x) (ScalarSQR(ScalarSQR(x))) #define INV(x) (kdiv(ToReal(1.0),x)) #define SQR(x) (kmul(x,x)) #define CUB(x) (kmul(x,SQR(x))) #define QAD(x) (SQR(SQR(x))) extern "C" void WT_CL_Energy_SelectBCs(CCTK_ARGUMENTS) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; if (cctk_iteration % WT_CL_Energy_calc_every != WT_CL_Energy_calc_offset) return; CCTK_INT ierr CCTK_ATTRIBUTE_UNUSED = 0; ierr = Boundary_SelectGroupForBC(cctkGH, CCTK_ALL_FACES, GenericFD_GetBoundaryWidth(cctkGH), -1 /* no table */, "ML_WaveToy_CL::WT_eps","flat"); if (ierr < 0) CCTK_WARN(1, "Failed to register flat BC for ML_WaveToy_CL::WT_eps."); return; } static void WT_CL_Energy_Body(const cGH* restrict const cctkGH, const int dir, const int face, const CCTK_REAL normal[3], const CCTK_REAL tangentA[3], const CCTK_REAL tangentB[3], const int imin[3], const int imax[3], const int n_subblock_gfs, CCTK_REAL* restrict const subblock_gfs[]) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; const char* const source = "\n" "/* Include user-supplied include files */\n" "\n" "/* Initialise finite differencing variables */\n" "const ptrdiff_t di CCTK_ATTRIBUTE_UNUSED = 1;\n" "const ptrdiff_t dj CCTK_ATTRIBUTE_UNUSED = CCTK_GFINDEX3D(cctkGH,0,1,0) - CCTK_GFINDEX3D(cctkGH,0,0,0);\n" "const ptrdiff_t dk CCTK_ATTRIBUTE_UNUSED = CCTK_GFINDEX3D(cctkGH,0,0,1) - CCTK_GFINDEX3D(cctkGH,0,0,0);\n" "const ptrdiff_t cdi CCTK_ATTRIBUTE_UNUSED = sizeof(CCTK_REAL) * di;\n" "const ptrdiff_t cdj CCTK_ATTRIBUTE_UNUSED = sizeof(CCTK_REAL) * dj;\n" "const ptrdiff_t cdk CCTK_ATTRIBUTE_UNUSED = sizeof(CCTK_REAL) * dk;\n" "const CCTK_REAL_VEC dx CCTK_ATTRIBUTE_UNUSED = ToReal(CCTK_DELTA_SPACE(0));\n" "const CCTK_REAL_VEC dy CCTK_ATTRIBUTE_UNUSED = ToReal(CCTK_DELTA_SPACE(1));\n" "const CCTK_REAL_VEC dz CCTK_ATTRIBUTE_UNUSED = ToReal(CCTK_DELTA_SPACE(2));\n" "const CCTK_REAL_VEC dt CCTK_ATTRIBUTE_UNUSED = ToReal(CCTK_DELTA_TIME);\n" "const CCTK_REAL_VEC t CCTK_ATTRIBUTE_UNUSED = ToReal(cctk_time);\n" "const CCTK_REAL_VEC dxi CCTK_ATTRIBUTE_UNUSED = INV(dx);\n" "const CCTK_REAL_VEC dyi CCTK_ATTRIBUTE_UNUSED = INV(dy);\n" "const CCTK_REAL_VEC dzi CCTK_ATTRIBUTE_UNUSED = INV(dz);\n" "const CCTK_REAL_VEC khalf CCTK_ATTRIBUTE_UNUSED = ToReal(0.5);\n" "const CCTK_REAL_VEC kthird CCTK_ATTRIBUTE_UNUSED = \n" " ToReal(0.333333333333333333333333333333);\n" "const CCTK_REAL_VEC ktwothird CCTK_ATTRIBUTE_UNUSED = \n" " ToReal(0.666666666666666666666666666667);\n" "const CCTK_REAL_VEC kfourthird CCTK_ATTRIBUTE_UNUSED = \n" " ToReal(1.33333333333333333333333333333);\n" "const CCTK_REAL_VEC hdxi CCTK_ATTRIBUTE_UNUSED = \n" " kmul(dxi,ToReal(0.5));\n" "const CCTK_REAL_VEC hdyi CCTK_ATTRIBUTE_UNUSED = \n" " kmul(dyi,ToReal(0.5));\n" "const CCTK_REAL_VEC hdzi CCTK_ATTRIBUTE_UNUSED = \n" " kmul(dzi,ToReal(0.5));\n" "\n" "/* Initialize predefined quantities */\n" "const CCTK_REAL_VEC p1o12dx CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.0833333333333333333333333333333),dx);\n" "const CCTK_REAL_VEC p1o12dy CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.0833333333333333333333333333333),dy);\n" "const CCTK_REAL_VEC p1o12dz CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.0833333333333333333333333333333),dz);\n" "const CCTK_REAL_VEC p1o144dxdy CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.00694444444444444444444444444444),kmul(dy,dx));\n" "const CCTK_REAL_VEC p1o144dxdz CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.00694444444444444444444444444444),kmul(dz,dx));\n" "const CCTK_REAL_VEC p1o144dydz CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(0.00694444444444444444444444444444),kmul(dz,dy));\n" "const CCTK_REAL_VEC pm1o12dx2 CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(-0.0833333333333333333333333333333),kmul(dx,dx));\n" "const CCTK_REAL_VEC pm1o12dy2 CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(-0.0833333333333333333333333333333),kmul(dy,dy));\n" "const CCTK_REAL_VEC pm1o12dz2 CCTK_ATTRIBUTE_UNUSED = kdiv(ToReal(-0.0833333333333333333333333333333),kmul(dz,dz));\n" "\n" "/* Assign local copies of arrays functions */\n" "\n" "\n" "\n" "/* Calculate temporaries and arrays functions */\n" "\n" "/* Copy local copies back to grid functions */\n" "\n" "/* Loop over the grid points */\n" "const int imin0=imin[0];\n" "const int imin1=imin[1];\n" "const int imin2=imin[2];\n" "const int imax0=imax[0];\n" "const int imax1=imax[1];\n" "const int imax2=imax[2];\n" "#pragma omp parallel // reduction(+: vec_iter_counter, vec_op_counter, vec_mem_counter)\n" "CCTK_LOOP3STR(WT_CL_Energy,\n" " i,j,k, imin0,imin1,imin2, imax0,imax1,imax2,\n" " cctk_ash[0],cctk_ash[1],cctk_ash[2],\n" " vecimin,vecimax, CCTK_REAL_VEC_SIZE)\n" "{\n" " const ptrdiff_t index CCTK_ATTRIBUTE_UNUSED = di*i + dj*j + dk*k;\n" " // vec_iter_counter+=CCTK_REAL_VEC_SIZE;\n" " \n" " /* Assign local copies of grid functions */\n" " \n" " CCTK_REAL_VEC rhoL CCTK_ATTRIBUTE_UNUSED = vec_load(rho[index]);\n" " CCTK_REAL_VEC uL CCTK_ATTRIBUTE_UNUSED = vec_load(u[index]);\n" " \n" " \n" " /* Include user supplied include files */\n" " \n" " /* Precompute derivatives */\n" " const CCTK_REAL_VEC PDstandardNth1u CCTK_ATTRIBUTE_UNUSED = PDstandardNth1(&u[index]);\n" " const CCTK_REAL_VEC PDstandardNth2u CCTK_ATTRIBUTE_UNUSED = PDstandardNth2(&u[index]);\n" " const CCTK_REAL_VEC PDstandardNth3u CCTK_ATTRIBUTE_UNUSED = PDstandardNth3(&u[index]);\n" " \n" " /* Calculate temporaries and grid functions */\n" " CCTK_REAL_VEC epsL CCTK_ATTRIBUTE_UNUSED = \n" " kmul(kmadd(rhoL,rhoL,kmadd(PDstandardNth1u,PDstandardNth1u,kmadd(PDstandardNth2u,PDstandardNth2u,kmul(PDstandardNth3u,PDstandardNth3u)))),ToReal(0.5));\n" " \n" " /* Copy local copies back to grid functions */\n" " vec_store_partial_prepare(i,lc_imin,lc_imax);\n" " vec_store_nta_partial(eps[index],epsL);\n" "}\n" "CCTK_ENDLOOP3STR(WT_CL_Energy);\n" "" ; const char* const groups[] = { "ML_WaveToy_CL::WT_eps", "ML_WaveToy_CL::WT_rho", "ML_WaveToy_CL::WT_u", NULL}; static struct OpenCLKernel *kernel = NULL; const char* const sources[] = {differencing, source, NULL}; OpenCLRunTime_CallKernel(cctkGH, CCTK_THORNSTRING, "WT_CL_Energy", sources, groups, NULL, NULL, NULL, -1, imin, imax, &kernel); } extern "C" void WT_CL_Energy(CCTK_ARGUMENTS) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; if (verbose > 1) { CCTK_VInfo(CCTK_THORNSTRING,"Entering WT_CL_Energy_Body"); } if (cctk_iteration % WT_CL_Energy_calc_every != WT_CL_Energy_calc_offset) { return; } const char* const groups[] = { "ML_WaveToy_CL::WT_eps", "ML_WaveToy_CL::WT_rho", "ML_WaveToy_CL::WT_u"}; GenericFD_AssertGroupStorage(cctkGH, "WT_CL_Energy", 3, groups); GenericFD_EnsureStencilFits(cctkGH, "WT_CL_Energy", 2, 2, 2); GenericFD_LoopOverInterior(cctkGH, WT_CL_Energy_Body); if (verbose > 1) { CCTK_VInfo(CCTK_THORNSTRING,"Leaving WT_CL_Energy_Body"); } }