/* File produced by Kranc */ #define KRANC_C #include #include #include #include #include #include "cctk.h" #include "cctk_Arguments.h" #include "cctk_Parameters.h" #include "GenericFD.h" #include "Differencing.h" #include "cctk_Loop.h" #include "loopcontrol.h" #include "OpenCLRunTime.h" #include "vectors.h" /* Define macros used in calculations */ #define INITVALUE (42) #define QAD(x) (SQR(SQR(x))) #define INV(x) (kdiv(ToReal(1.0),x)) #define SQR(x) (kmul(x,x)) #define CUB(x) (kmul(x,SQR(x))) extern "C" void EM_evol_SelectBCs(CCTK_ARGUMENTS) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; CCTK_INT ierr = 0; ierr = Boundary_SelectGroupForBC(cctkGH, CCTK_ALL_FACES, GenericFD_GetBoundaryWidth(cctkGH), -1 /* no table */, "My_New_Implementation::B_grouprhs","flat"); if (ierr < 0) CCTK_WARN(1, "Failed to register flat BC for My_New_Implementation::B_grouprhs."); ierr = Boundary_SelectGroupForBC(cctkGH, CCTK_ALL_FACES, GenericFD_GetBoundaryWidth(cctkGH), -1 /* no table */, "My_New_Implementation::El_grouprhs","flat"); if (ierr < 0) CCTK_WARN(1, "Failed to register flat BC for My_New_Implementation::El_grouprhs."); return; } static void EM_evol_Body(cGH const * restrict const cctkGH, int const dir, int const face, CCTK_REAL const normal[3], CCTK_REAL const tangentA[3], CCTK_REAL const tangentB[3], int const imin[3], int const imax[3], int const n_subblock_gfs, CCTK_REAL * restrict const subblock_gfs[]) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; char const * const source = "\n" "/* Declare finite differencing variables */\n" "\n" "/* Include user-supplied include files */\n" "\n" "/* Initialise finite differencing variables */\n" "ptrdiff_t const di = 1;\n" "ptrdiff_t const dj = CCTK_GFINDEX3D(cctkGH,0,1,0) - CCTK_GFINDEX3D(cctkGH,0,0,0);\n" "ptrdiff_t const dk = CCTK_GFINDEX3D(cctkGH,0,0,1) - CCTK_GFINDEX3D(cctkGH,0,0,0);\n" "ptrdiff_t const cdi = sizeof(CCTK_REAL) * di;\n" "ptrdiff_t const cdj = sizeof(CCTK_REAL) * dj;\n" "ptrdiff_t const cdk = sizeof(CCTK_REAL) * dk;\n" "CCTK_REAL_VEC const dx = ToReal(CCTK_DELTA_SPACE(0));\n" "CCTK_REAL_VEC const dy = ToReal(CCTK_DELTA_SPACE(1));\n" "CCTK_REAL_VEC const dz = ToReal(CCTK_DELTA_SPACE(2));\n" "CCTK_REAL_VEC const dt = ToReal(CCTK_DELTA_TIME);\n" "CCTK_REAL_VEC const t = ToReal(cctk_time);\n" "CCTK_REAL_VEC const dxi = INV(dx);\n" "CCTK_REAL_VEC const dyi = INV(dy);\n" "CCTK_REAL_VEC const dzi = INV(dz);\n" "CCTK_REAL_VEC const khalf = ToReal(0.5);\n" "CCTK_REAL_VEC const kthird = ToReal(1.0/3.0);\n" "CCTK_REAL_VEC const ktwothird = ToReal(2.0/3.0);\n" "CCTK_REAL_VEC const kfourthird = ToReal(4.0/3.0);\n" "CCTK_REAL_VEC const keightthird = ToReal(8.0/3.0);\n" "CCTK_REAL_VEC const hdxi = kmul(ToReal(0.5), dxi);\n" "CCTK_REAL_VEC const hdyi = kmul(ToReal(0.5), dyi);\n" "CCTK_REAL_VEC const hdzi = kmul(ToReal(0.5), dzi);\n" "\n" "/* Initialize predefined quantities */\n" "CCTK_REAL_VEC const p1o12dx = kmul(INV(dx),ToReal(0.0833333333333333333333333333333));\n" "CCTK_REAL_VEC const p1o12dy = kmul(INV(dy),ToReal(0.0833333333333333333333333333333));\n" "CCTK_REAL_VEC const p1o12dz = kmul(INV(dz),ToReal(0.0833333333333333333333333333333));\n" "CCTK_REAL_VEC const p1o144dxdy = kmul(INV(dx),kmul(INV(dy),ToReal(0.00694444444444444444444444444444)));\n" "CCTK_REAL_VEC const p1o144dxdz = kmul(INV(dx),kmul(INV(dz),ToReal(0.00694444444444444444444444444444)));\n" "CCTK_REAL_VEC const p1o144dydz = kmul(INV(dy),kmul(INV(dz),ToReal(0.00694444444444444444444444444444)));\n" "CCTK_REAL_VEC const p1o2dx = kmul(INV(dx),ToReal(0.5));\n" "CCTK_REAL_VEC const p1o2dy = kmul(INV(dy),ToReal(0.5));\n" "CCTK_REAL_VEC const p1o2dz = kmul(INV(dz),ToReal(0.5));\n" "CCTK_REAL_VEC const p1o4dxdy = kmul(INV(dx),kmul(INV(dy),ToReal(0.25)));\n" "CCTK_REAL_VEC const p1o4dxdz = kmul(INV(dx),kmul(INV(dz),ToReal(0.25)));\n" "CCTK_REAL_VEC const p1o4dydz = kmul(INV(dy),kmul(INV(dz),ToReal(0.25)));\n" "CCTK_REAL_VEC const p1odx2 = INV(SQR(dx));\n" "CCTK_REAL_VEC const p1ody2 = INV(SQR(dy));\n" "CCTK_REAL_VEC const p1odz2 = INV(SQR(dz));\n" "CCTK_REAL_VEC const pm1o12dx2 = kmul(INV(SQR(dx)),ToReal(-0.0833333333333333333333333333333));\n" "CCTK_REAL_VEC const pm1o12dy2 = kmul(INV(SQR(dy)),ToReal(-0.0833333333333333333333333333333));\n" "CCTK_REAL_VEC const pm1o12dz2 = kmul(INV(SQR(dz)),ToReal(-0.0833333333333333333333333333333));\n" "\n" "/* Jacobian variable pointers */\n" "bool const use_jacobian = (!CCTK_IsFunctionAliased(\"MultiPatch_GetMap\") || MultiPatch_GetMap(cctkGH) != jacobian_identity_map)\n" " && strlen(jacobian_group) > 0;\n" "if (use_jacobian && strlen(jacobian_derivative_group) == 0)\n" "{\n" " CCTK_WARN (1, \"GenericFD::jacobian_group and GenericFD::jacobian_derivative_group must both be set to valid group names\");\n" "}\n" "\n" "CCTK_REAL const *restrict jacobian_ptrs[9];\n" "if (use_jacobian) GenericFD_GroupDataPointers(cctkGH, jacobian_group,\n" " 9, jacobian_ptrs);\n" "\n" "CCTK_REAL const *restrict const J11 = use_jacobian ? jacobian_ptrs[0] : 0;\n" "CCTK_REAL const *restrict const J12 = use_jacobian ? jacobian_ptrs[1] : 0;\n" "CCTK_REAL const *restrict const J13 = use_jacobian ? jacobian_ptrs[2] : 0;\n" "CCTK_REAL const *restrict const J21 = use_jacobian ? jacobian_ptrs[3] : 0;\n" "CCTK_REAL const *restrict const J22 = use_jacobian ? jacobian_ptrs[4] : 0;\n" "CCTK_REAL const *restrict const J23 = use_jacobian ? jacobian_ptrs[5] : 0;\n" "CCTK_REAL const *restrict const J31 = use_jacobian ? jacobian_ptrs[6] : 0;\n" "CCTK_REAL const *restrict const J32 = use_jacobian ? jacobian_ptrs[7] : 0;\n" "CCTK_REAL const *restrict const J33 = use_jacobian ? jacobian_ptrs[8] : 0;\n" "\n" "CCTK_REAL const *restrict jacobian_derivative_ptrs[18];\n" "if (use_jacobian) GenericFD_GroupDataPointers(cctkGH, jacobian_derivative_group,\n" " 18, jacobian_derivative_ptrs);\n" "\n" "CCTK_REAL const *restrict const dJ111 = use_jacobian ? jacobian_derivative_ptrs[0] : 0;\n" "CCTK_REAL const *restrict const dJ112 = use_jacobian ? jacobian_derivative_ptrs[1] : 0;\n" "CCTK_REAL const *restrict const dJ113 = use_jacobian ? jacobian_derivative_ptrs[2] : 0;\n" "CCTK_REAL const *restrict const dJ122 = use_jacobian ? jacobian_derivative_ptrs[3] : 0;\n" "CCTK_REAL const *restrict const dJ123 = use_jacobian ? jacobian_derivative_ptrs[4] : 0;\n" "CCTK_REAL const *restrict const dJ133 = use_jacobian ? jacobian_derivative_ptrs[5] : 0;\n" "CCTK_REAL const *restrict const dJ211 = use_jacobian ? jacobian_derivative_ptrs[6] : 0;\n" "CCTK_REAL const *restrict const dJ212 = use_jacobian ? jacobian_derivative_ptrs[7] : 0;\n" "CCTK_REAL const *restrict const dJ213 = use_jacobian ? jacobian_derivative_ptrs[8] : 0;\n" "CCTK_REAL const *restrict const dJ222 = use_jacobian ? jacobian_derivative_ptrs[9] : 0;\n" "CCTK_REAL const *restrict const dJ223 = use_jacobian ? jacobian_derivative_ptrs[10] : 0;\n" "CCTK_REAL const *restrict const dJ233 = use_jacobian ? jacobian_derivative_ptrs[11] : 0;\n" "CCTK_REAL const *restrict const dJ311 = use_jacobian ? jacobian_derivative_ptrs[12] : 0;\n" "CCTK_REAL const *restrict const dJ312 = use_jacobian ? jacobian_derivative_ptrs[13] : 0;\n" "CCTK_REAL const *restrict const dJ313 = use_jacobian ? jacobian_derivative_ptrs[14] : 0;\n" "CCTK_REAL const *restrict const dJ322 = use_jacobian ? jacobian_derivative_ptrs[15] : 0;\n" "CCTK_REAL const *restrict const dJ323 = use_jacobian ? jacobian_derivative_ptrs[16] : 0;\n" "CCTK_REAL const *restrict const dJ333 = use_jacobian ? jacobian_derivative_ptrs[17] : 0;\n" "\n" "/* Assign local copies of arrays functions */\n" "\n" "\n" "\n" "/* Calculate temporaries and arrays functions */\n" "\n" "/* Copy local copies back to grid functions */\n" "\n" "/* Loop over the grid points */\n" "#pragma omp parallel\n" "LC_LOOP3VEC (EM_evol,\n" " i,j,k, imin[0],imin[1],imin[2], imax[0],imax[1],imax[2],\n" " cctk_lsh[0],cctk_lsh[1],cctk_lsh[2],\n" " CCTK_REAL_VEC_SIZE)\n" "{\n" " ptrdiff_t const index = di*i + dj*j + dk*k;\n" " \n" " /* Assign local copies of grid functions */\n" " \n" " CCTK_REAL_VEC B1L = vec_load(B1[index]);\n" " CCTK_REAL_VEC B2L = vec_load(B2[index]);\n" " CCTK_REAL_VEC B3L = vec_load(B3[index]);\n" " CCTK_REAL_VEC El1L = vec_load(El1[index]);\n" " CCTK_REAL_VEC El2L = vec_load(El2[index]);\n" " CCTK_REAL_VEC El3L = vec_load(El3[index]);\n" " \n" " \n" " CCTK_REAL_VEC J11L, J12L, J13L, J21L, J22L, J23L, J31L, J32L, J33L;\n" " \n" " if (use_jacobian)\n" " {\n" " J11L = vec_load(J11[index]);\n" " J12L = vec_load(J12[index]);\n" " J13L = vec_load(J13[index]);\n" " J21L = vec_load(J21[index]);\n" " J22L = vec_load(J22[index]);\n" " J23L = vec_load(J23[index]);\n" " J31L = vec_load(J31[index]);\n" " J32L = vec_load(J32[index]);\n" " J33L = vec_load(J33[index]);\n" " }\n" " \n" " /* Include user supplied include files */\n" " \n" " /* Precompute derivatives */\n" " CCTK_REAL_VEC PDstandard1B1;\n" " CCTK_REAL_VEC PDstandard2B1;\n" " CCTK_REAL_VEC PDstandard3B1;\n" " CCTK_REAL_VEC PDstandard1B2;\n" " CCTK_REAL_VEC PDstandard2B2;\n" " CCTK_REAL_VEC PDstandard3B2;\n" " CCTK_REAL_VEC PDstandard1B3;\n" " CCTK_REAL_VEC PDstandard2B3;\n" " CCTK_REAL_VEC PDstandard3B3;\n" " CCTK_REAL_VEC PDstandard1El1;\n" " CCTK_REAL_VEC PDstandard2El1;\n" " CCTK_REAL_VEC PDstandard3El1;\n" " CCTK_REAL_VEC PDstandard1El2;\n" " CCTK_REAL_VEC PDstandard2El2;\n" " CCTK_REAL_VEC PDstandard3El2;\n" " CCTK_REAL_VEC PDstandard1El3;\n" " CCTK_REAL_VEC PDstandard2El3;\n" " CCTK_REAL_VEC PDstandard3El3;\n" " \n" " switch(fdOrder)\n" " {\n" " case 2:\n" " PDstandard1B1 = PDstandardfdOrder21(&B1[index]);\n" " PDstandard2B1 = PDstandardfdOrder22(&B1[index]);\n" " PDstandard3B1 = PDstandardfdOrder23(&B1[index]);\n" " PDstandard1B2 = PDstandardfdOrder21(&B2[index]);\n" " PDstandard2B2 = PDstandardfdOrder22(&B2[index]);\n" " PDstandard3B2 = PDstandardfdOrder23(&B2[index]);\n" " PDstandard1B3 = PDstandardfdOrder21(&B3[index]);\n" " PDstandard2B3 = PDstandardfdOrder22(&B3[index]);\n" " PDstandard3B3 = PDstandardfdOrder23(&B3[index]);\n" " PDstandard1El1 = PDstandardfdOrder21(&El1[index]);\n" " PDstandard2El1 = PDstandardfdOrder22(&El1[index]);\n" " PDstandard3El1 = PDstandardfdOrder23(&El1[index]);\n" " PDstandard1El2 = PDstandardfdOrder21(&El2[index]);\n" " PDstandard2El2 = PDstandardfdOrder22(&El2[index]);\n" " PDstandard3El2 = PDstandardfdOrder23(&El2[index]);\n" " PDstandard1El3 = PDstandardfdOrder21(&El3[index]);\n" " PDstandard2El3 = PDstandardfdOrder22(&El3[index]);\n" " PDstandard3El3 = PDstandardfdOrder23(&El3[index]);\n" " break;\n" " \n" " case 4:\n" " PDstandard1B1 = PDstandardfdOrder41(&B1[index]);\n" " PDstandard2B1 = PDstandardfdOrder42(&B1[index]);\n" " PDstandard3B1 = PDstandardfdOrder43(&B1[index]);\n" " PDstandard1B2 = PDstandardfdOrder41(&B2[index]);\n" " PDstandard2B2 = PDstandardfdOrder42(&B2[index]);\n" " PDstandard3B2 = PDstandardfdOrder43(&B2[index]);\n" " PDstandard1B3 = PDstandardfdOrder41(&B3[index]);\n" " PDstandard2B3 = PDstandardfdOrder42(&B3[index]);\n" " PDstandard3B3 = PDstandardfdOrder43(&B3[index]);\n" " PDstandard1El1 = PDstandardfdOrder41(&El1[index]);\n" " PDstandard2El1 = PDstandardfdOrder42(&El1[index]);\n" " PDstandard3El1 = PDstandardfdOrder43(&El1[index]);\n" " PDstandard1El2 = PDstandardfdOrder41(&El2[index]);\n" " PDstandard2El2 = PDstandardfdOrder42(&El2[index]);\n" " PDstandard3El2 = PDstandardfdOrder43(&El2[index]);\n" " PDstandard1El3 = PDstandardfdOrder41(&El3[index]);\n" " PDstandard2El3 = PDstandardfdOrder42(&El3[index]);\n" " PDstandard3El3 = PDstandardfdOrder43(&El3[index]);\n" " break;\n" " }\n" " \n" " /* Calculate temporaries and grid functions */\n" " CCTK_REAL_VEC JacPDstandard1B2;\n" " CCTK_REAL_VEC JacPDstandard1B3;\n" " CCTK_REAL_VEC JacPDstandard1El2;\n" " CCTK_REAL_VEC JacPDstandard1El3;\n" " CCTK_REAL_VEC JacPDstandard2B1;\n" " CCTK_REAL_VEC JacPDstandard2B3;\n" " CCTK_REAL_VEC JacPDstandard2El1;\n" " CCTK_REAL_VEC JacPDstandard2El3;\n" " CCTK_REAL_VEC JacPDstandard3B1;\n" " CCTK_REAL_VEC JacPDstandard3B2;\n" " CCTK_REAL_VEC JacPDstandard3El1;\n" " CCTK_REAL_VEC JacPDstandard3El2;\n" " \n" " if (use_jacobian)\n" " {\n" " JacPDstandard1B2 = \n" " kmadd(J11L,PDstandard1B2,kmadd(J21L,PDstandard2B2,kmul(J31L,PDstandard3B2)));\n" " \n" " JacPDstandard1B3 = \n" " kmadd(J11L,PDstandard1B3,kmadd(J21L,PDstandard2B3,kmul(J31L,PDstandard3B3)));\n" " \n" " JacPDstandard1El2 = \n" " kmadd(J11L,PDstandard1El2,kmadd(J21L,PDstandard2El2,kmul(J31L,PDstandard3El2)));\n" " \n" " JacPDstandard1El3 = \n" " kmadd(J11L,PDstandard1El3,kmadd(J21L,PDstandard2El3,kmul(J31L,PDstandard3El3)));\n" " \n" " JacPDstandard2B1 = \n" " kmadd(J12L,PDstandard1B1,kmadd(J22L,PDstandard2B1,kmul(J32L,PDstandard3B1)));\n" " \n" " JacPDstandard2B3 = \n" " kmadd(J12L,PDstandard1B3,kmadd(J22L,PDstandard2B3,kmul(J32L,PDstandard3B3)));\n" " \n" " JacPDstandard2El1 = \n" " kmadd(J12L,PDstandard1El1,kmadd(J22L,PDstandard2El1,kmul(J32L,PDstandard3El1)));\n" " \n" " JacPDstandard2El3 = \n" " kmadd(J12L,PDstandard1El3,kmadd(J22L,PDstandard2El3,kmul(J32L,PDstandard3El3)));\n" " \n" " JacPDstandard3B1 = \n" " kmadd(J13L,PDstandard1B1,kmadd(J23L,PDstandard2B1,kmul(J33L,PDstandard3B1)));\n" " \n" " JacPDstandard3B2 = \n" " kmadd(J13L,PDstandard1B2,kmadd(J23L,PDstandard2B2,kmul(J33L,PDstandard3B2)));\n" " \n" " JacPDstandard3El1 = \n" " kmadd(J13L,PDstandard1El1,kmadd(J23L,PDstandard2El1,kmul(J33L,PDstandard3El1)));\n" " \n" " JacPDstandard3El2 = \n" " kmadd(J13L,PDstandard1El2,kmadd(J23L,PDstandard2El2,kmul(J33L,PDstandard3El2)));\n" " }\n" " else\n" " {\n" " JacPDstandard1B2 = PDstandard1B2;\n" " \n" " JacPDstandard1B3 = PDstandard1B3;\n" " \n" " JacPDstandard1El2 = PDstandard1El2;\n" " \n" " JacPDstandard1El3 = PDstandard1El3;\n" " \n" " JacPDstandard2B1 = PDstandard2B1;\n" " \n" " JacPDstandard2B3 = PDstandard2B3;\n" " \n" " JacPDstandard2El1 = PDstandard2El1;\n" " \n" " JacPDstandard2El3 = PDstandard2El3;\n" " \n" " JacPDstandard3B1 = PDstandard3B1;\n" " \n" " JacPDstandard3B2 = PDstandard3B2;\n" " \n" " JacPDstandard3El1 = PDstandard3El1;\n" " \n" " JacPDstandard3El2 = PDstandard3El2;\n" " }\n" " \n" " CCTK_REAL_VEC El1rhsL = ksub(JacPDstandard2B3,JacPDstandard3B2);\n" " \n" " CCTK_REAL_VEC El2rhsL = ksub(JacPDstandard3B1,JacPDstandard1B3);\n" " \n" " CCTK_REAL_VEC El3rhsL = ksub(JacPDstandard1B2,JacPDstandard2B1);\n" " \n" " CCTK_REAL_VEC B1rhsL = ksub(JacPDstandard3El2,JacPDstandard2El3);\n" " \n" " CCTK_REAL_VEC B2rhsL = ksub(JacPDstandard1El3,JacPDstandard3El1);\n" " \n" " CCTK_REAL_VEC B3rhsL = ksub(JacPDstandard2El1,JacPDstandard1El2);\n" " \n" " /* Copy local copies back to grid functions */\n" " vec_store_nta_partial(B1rhs[index],B1rhsL);\n" " vec_store_nta_partial(B2rhs[index],B2rhsL);\n" " vec_store_nta_partial(B3rhs[index],B3rhsL);\n" " vec_store_nta_partial(El1rhs[index],El1rhsL);\n" " vec_store_nta_partial(El2rhs[index],El2rhsL);\n" " vec_store_nta_partial(El3rhs[index],El3rhsL);\n" "}\n" "LC_ENDLOOP3VEC (EM_evol);\n" "" ; char const * const groups[] = {"My_New_Implementation::B_group","My_New_Implementation::B_grouprhs","My_New_Implementation::El_group","My_New_Implementation::El_grouprhs",NULL}; static struct OpenCLKernel * kernel = NULL; char const * const sources[] = {differencing, source, NULL}; OpenCLRunTime_CallKernel (cctkGH, CCTK_THORNSTRING, "EM_evol", sources, groups, NULL, NULL, NULL, -1, imin, imax, &kernel); } extern "C" void EM_evol(CCTK_ARGUMENTS) { DECLARE_CCTK_ARGUMENTS; DECLARE_CCTK_PARAMETERS; if (verbose > 1) { CCTK_VInfo(CCTK_THORNSTRING,"Entering EM_evol_Body"); } if (cctk_iteration % EM_evol_calc_every != EM_evol_calc_offset) { return; } const char *groups[] = {"My_New_Implementation::B_group","My_New_Implementation::B_grouprhs","My_New_Implementation::El_group","My_New_Implementation::El_grouprhs"}; GenericFD_AssertGroupStorage(cctkGH, "EM_evol", 4, groups); switch(fdOrder) { case 2: GenericFD_EnsureStencilFits(cctkGH, "EM_evol", 1, 1, 1); break; case 4: GenericFD_EnsureStencilFits(cctkGH, "EM_evol", 2, 2, 2); break; } GenericFD_LoopOverInterior(cctkGH, &EM_evol_Body); if (verbose > 1) { CCTK_VInfo(CCTK_THORNSTRING,"Leaving EM_evol_Body"); } }