diff options
Diffstat (limited to 'ML_BSSN/src/ML_BSSN_RHS1.cc')
-rw-r--r-- | ML_BSSN/src/ML_BSSN_RHS1.cc | 829 |
1 files changed, 437 insertions, 392 deletions
diff --git a/ML_BSSN/src/ML_BSSN_RHS1.cc b/ML_BSSN/src/ML_BSSN_RHS1.cc index 1c2e051..41593a4 100644 --- a/ML_BSSN/src/ML_BSSN_RHS1.cc +++ b/ML_BSSN/src/ML_BSSN_RHS1.cc @@ -13,13 +13,14 @@ #include "GenericFD.h" #include "Differencing.h" #include "loopcontrol.h" +#include "vectors.h" /* Define macros used in calculations */ #define INITVALUE (42) #define QAD(x) (SQR(SQR(x))) -#define INV(x) ((1.0) / (x)) -#define SQR(x) ((x) * (x)) -#define CUB(x) ((x) * (x) * (x)) +#define INV(x) (kdiv(ToReal(1.0),x)) +#define SQR(x) (kmul(x,x)) +#define CUB(x) (kmul(x,SQR(x))) extern "C" void ML_BSSN_RHS1_SelectBCs(CCTK_ARGUMENTS) { @@ -86,93 +87,94 @@ static void ML_BSSN_RHS1_Body(cGH const * restrict const cctkGH, int const dir, ptrdiff_t const cdi = sizeof(CCTK_REAL) * di; ptrdiff_t const cdj = sizeof(CCTK_REAL) * dj; ptrdiff_t const cdk = sizeof(CCTK_REAL) * dk; - CCTK_REAL const dx = ToReal(CCTK_DELTA_SPACE(0)); - CCTK_REAL const dy = ToReal(CCTK_DELTA_SPACE(1)); - CCTK_REAL const dz = ToReal(CCTK_DELTA_SPACE(2)); - CCTK_REAL const dt = ToReal(CCTK_DELTA_TIME); - CCTK_REAL const dxi = INV(dx); - CCTK_REAL const dyi = INV(dy); - CCTK_REAL const dzi = INV(dz); - CCTK_REAL const khalf = 0.5; - CCTK_REAL const kthird = 1/3.0; - CCTK_REAL const ktwothird = 2.0/3.0; - CCTK_REAL const kfourthird = 4.0/3.0; - CCTK_REAL const keightthird = 8.0/3.0; - CCTK_REAL const hdxi = 0.5 * dxi; - CCTK_REAL const hdyi = 0.5 * dyi; - CCTK_REAL const hdzi = 0.5 * dzi; + CCTK_REAL_VEC const dx = ToReal(CCTK_DELTA_SPACE(0)); + CCTK_REAL_VEC const dy = ToReal(CCTK_DELTA_SPACE(1)); + CCTK_REAL_VEC const dz = ToReal(CCTK_DELTA_SPACE(2)); + CCTK_REAL_VEC const dt = ToReal(CCTK_DELTA_TIME); + CCTK_REAL_VEC const dxi = INV(dx); + CCTK_REAL_VEC const dyi = INV(dy); + CCTK_REAL_VEC const dzi = INV(dz); + CCTK_REAL_VEC const khalf = ToReal(0.5); + CCTK_REAL_VEC const kthird = ToReal(1.0/3.0); + CCTK_REAL_VEC const ktwothird = ToReal(2.0/3.0); + CCTK_REAL_VEC const kfourthird = ToReal(4.0/3.0); + CCTK_REAL_VEC const keightthird = ToReal(8.0/3.0); + CCTK_REAL_VEC const hdxi = kmul(ToReal(0.5), dxi); + CCTK_REAL_VEC const hdyi = kmul(ToReal(0.5), dyi); + CCTK_REAL_VEC const hdzi = kmul(ToReal(0.5), dzi); /* Initialize predefined quantities */ - CCTK_REAL const p1o12dx = 0.0833333333333333333333333333333*INV(dx); - CCTK_REAL const p1o12dy = 0.0833333333333333333333333333333*INV(dy); - CCTK_REAL const p1o12dz = 0.0833333333333333333333333333333*INV(dz); - CCTK_REAL const p1o144dxdy = 0.00694444444444444444444444444444*INV(dx)*INV(dy); - CCTK_REAL const p1o144dxdz = 0.00694444444444444444444444444444*INV(dx)*INV(dz); - CCTK_REAL const p1o144dydz = 0.00694444444444444444444444444444*INV(dy)*INV(dz); - CCTK_REAL const p1o24dx = 0.0416666666666666666666666666667*INV(dx); - CCTK_REAL const p1o24dy = 0.0416666666666666666666666666667*INV(dy); - CCTK_REAL const p1o24dz = 0.0416666666666666666666666666667*INV(dz); - CCTK_REAL const p1o64dx = 0.015625*INV(dx); - CCTK_REAL const p1o64dy = 0.015625*INV(dy); - CCTK_REAL const p1o64dz = 0.015625*INV(dz); - CCTK_REAL const p1odx = INV(dx); - CCTK_REAL const p1ody = INV(dy); - CCTK_REAL const p1odz = INV(dz); - CCTK_REAL const pm1o12dx2 = -0.0833333333333333333333333333333*INV(SQR(dx)); - CCTK_REAL const pm1o12dy2 = -0.0833333333333333333333333333333*INV(SQR(dy)); - CCTK_REAL const pm1o12dz2 = -0.0833333333333333333333333333333*INV(SQR(dz)); + CCTK_REAL_VEC const p1o12dx = kmul(INV(dx),ToReal(0.0833333333333333333333333333333)); + CCTK_REAL_VEC const p1o12dy = kmul(INV(dy),ToReal(0.0833333333333333333333333333333)); + CCTK_REAL_VEC const p1o12dz = kmul(INV(dz),ToReal(0.0833333333333333333333333333333)); + CCTK_REAL_VEC const p1o144dxdy = kmul(INV(dx),kmul(INV(dy),ToReal(0.00694444444444444444444444444444))); + CCTK_REAL_VEC const p1o144dxdz = kmul(INV(dx),kmul(INV(dz),ToReal(0.00694444444444444444444444444444))); + CCTK_REAL_VEC const p1o144dydz = kmul(INV(dy),kmul(INV(dz),ToReal(0.00694444444444444444444444444444))); + CCTK_REAL_VEC const p1o24dx = kmul(INV(dx),ToReal(0.0416666666666666666666666666667)); + CCTK_REAL_VEC const p1o24dy = kmul(INV(dy),ToReal(0.0416666666666666666666666666667)); + CCTK_REAL_VEC const p1o24dz = kmul(INV(dz),ToReal(0.0416666666666666666666666666667)); + CCTK_REAL_VEC const p1o64dx = kmul(INV(dx),ToReal(0.015625)); + CCTK_REAL_VEC const p1o64dy = kmul(INV(dy),ToReal(0.015625)); + CCTK_REAL_VEC const p1o64dz = kmul(INV(dz),ToReal(0.015625)); + CCTK_REAL_VEC const p1odx = INV(dx); + CCTK_REAL_VEC const p1ody = INV(dy); + CCTK_REAL_VEC const p1odz = INV(dz); + CCTK_REAL_VEC const pm1o12dx2 = kmul(INV(SQR(dx)),ToReal(-0.0833333333333333333333333333333)); + CCTK_REAL_VEC const pm1o12dy2 = kmul(INV(SQR(dy)),ToReal(-0.0833333333333333333333333333333)); + CCTK_REAL_VEC const pm1o12dz2 = kmul(INV(SQR(dz)),ToReal(-0.0833333333333333333333333333333)); /* Loop over the grid points */ #pragma omp parallel - LC_LOOP3 (ML_BSSN_RHS1, + LC_LOOP3VEC (ML_BSSN_RHS1, i,j,k, min[0],min[1],min[2], max[0],max[1],max[2], - cctk_lsh[0],cctk_lsh[1],cctk_lsh[2]) + cctk_lsh[0],cctk_lsh[1],cctk_lsh[2], + CCTK_REAL_VEC_SIZE) { ptrdiff_t const index = di*i + dj*j + dk*k; /* Assign local copies of grid functions */ - CCTK_REAL AL = A[index]; - CCTK_REAL alphaL = alpha[index]; - CCTK_REAL At11L = At11[index]; - CCTK_REAL At12L = At12[index]; - CCTK_REAL At13L = At13[index]; - CCTK_REAL At22L = At22[index]; - CCTK_REAL At23L = At23[index]; - CCTK_REAL At33L = At33[index]; - CCTK_REAL B1L = B1[index]; - CCTK_REAL B2L = B2[index]; - CCTK_REAL B3L = B3[index]; - CCTK_REAL beta1L = beta1[index]; - CCTK_REAL beta2L = beta2[index]; - CCTK_REAL beta3L = beta3[index]; - CCTK_REAL gt11L = gt11[index]; - CCTK_REAL gt12L = gt12[index]; - CCTK_REAL gt13L = gt13[index]; - CCTK_REAL gt22L = gt22[index]; - CCTK_REAL gt23L = gt23[index]; - CCTK_REAL gt33L = gt33[index]; - CCTK_REAL phiL = phi[index]; - CCTK_REAL rL = r[index]; - CCTK_REAL trKL = trK[index]; - CCTK_REAL Xt1L = Xt1[index]; - CCTK_REAL Xt2L = Xt2[index]; - CCTK_REAL Xt3L = Xt3[index]; - - CCTK_REAL eTttL, eTtxL, eTtyL, eTtzL, eTxxL, eTxyL, eTxzL, eTyyL, eTyzL, eTzzL; + CCTK_REAL_VEC AL = vec_load(A[index]); + CCTK_REAL_VEC alphaL = vec_load(alpha[index]); + CCTK_REAL_VEC At11L = vec_load(At11[index]); + CCTK_REAL_VEC At12L = vec_load(At12[index]); + CCTK_REAL_VEC At13L = vec_load(At13[index]); + CCTK_REAL_VEC At22L = vec_load(At22[index]); + CCTK_REAL_VEC At23L = vec_load(At23[index]); + CCTK_REAL_VEC At33L = vec_load(At33[index]); + CCTK_REAL_VEC B1L = vec_load(B1[index]); + CCTK_REAL_VEC B2L = vec_load(B2[index]); + CCTK_REAL_VEC B3L = vec_load(B3[index]); + CCTK_REAL_VEC beta1L = vec_load(beta1[index]); + CCTK_REAL_VEC beta2L = vec_load(beta2[index]); + CCTK_REAL_VEC beta3L = vec_load(beta3[index]); + CCTK_REAL_VEC gt11L = vec_load(gt11[index]); + CCTK_REAL_VEC gt12L = vec_load(gt12[index]); + CCTK_REAL_VEC gt13L = vec_load(gt13[index]); + CCTK_REAL_VEC gt22L = vec_load(gt22[index]); + CCTK_REAL_VEC gt23L = vec_load(gt23[index]); + CCTK_REAL_VEC gt33L = vec_load(gt33[index]); + CCTK_REAL_VEC phiL = vec_load(phi[index]); + CCTK_REAL_VEC rL = vec_load(r[index]); + CCTK_REAL_VEC trKL = vec_load(trK[index]); + CCTK_REAL_VEC Xt1L = vec_load(Xt1[index]); + CCTK_REAL_VEC Xt2L = vec_load(Xt2[index]); + CCTK_REAL_VEC Xt3L = vec_load(Xt3[index]); + + CCTK_REAL_VEC eTttL, eTtxL, eTtyL, eTtzL, eTxxL, eTxyL, eTxzL, eTyyL, eTyzL, eTzzL; if (*stress_energy_state) { - eTttL = eTtt[index]; - eTtxL = eTtx[index]; - eTtyL = eTty[index]; - eTtzL = eTtz[index]; - eTxxL = eTxx[index]; - eTxyL = eTxy[index]; - eTxzL = eTxz[index]; - eTyyL = eTyy[index]; - eTyzL = eTyz[index]; - eTzzL = eTzz[index]; + eTttL = vec_load(eTtt[index]); + eTtxL = vec_load(eTtx[index]); + eTtyL = vec_load(eTty[index]); + eTtzL = vec_load(eTtz[index]); + eTxxL = vec_load(eTxx[index]); + eTxyL = vec_load(eTxy[index]); + eTxzL = vec_load(eTxz[index]); + eTyyL = vec_load(eTyy[index]); + eTyzL = vec_load(eTyz[index]); + eTzzL = vec_load(eTzz[index]); } else { @@ -191,66 +193,66 @@ static void ML_BSSN_RHS1_Body(cGH const * restrict const cctkGH, int const dir, /* Include user supplied include files */ /* Precompute derivatives */ - CCTK_REAL const PDstandardNth1alpha = PDstandardNth1(&alpha[index]); - CCTK_REAL const PDstandardNth2alpha = PDstandardNth2(&alpha[index]); - CCTK_REAL const PDstandardNth3alpha = PDstandardNth3(&alpha[index]); - CCTK_REAL const PDstandardNth11alpha = PDstandardNth11(&alpha[index]); - CCTK_REAL const PDstandardNth22alpha = PDstandardNth22(&alpha[index]); - CCTK_REAL const PDstandardNth33alpha = PDstandardNth33(&alpha[index]); - CCTK_REAL const PDstandardNth12alpha = PDstandardNth12(&alpha[index]); - CCTK_REAL const PDstandardNth13alpha = PDstandardNth13(&alpha[index]); - CCTK_REAL const PDstandardNth23alpha = PDstandardNth23(&alpha[index]); - CCTK_REAL const PDstandardNth1beta1 = PDstandardNth1(&beta1[index]); - CCTK_REAL const PDstandardNth2beta1 = PDstandardNth2(&beta1[index]); - CCTK_REAL const PDstandardNth3beta1 = PDstandardNth3(&beta1[index]); - CCTK_REAL const PDstandardNth11beta1 = PDstandardNth11(&beta1[index]); - CCTK_REAL const PDstandardNth22beta1 = PDstandardNth22(&beta1[index]); - CCTK_REAL const PDstandardNth33beta1 = PDstandardNth33(&beta1[index]); - CCTK_REAL const PDstandardNth12beta1 = PDstandardNth12(&beta1[index]); - CCTK_REAL const PDstandardNth13beta1 = PDstandardNth13(&beta1[index]); - CCTK_REAL const PDstandardNth23beta1 = PDstandardNth23(&beta1[index]); - CCTK_REAL const PDstandardNth1beta2 = PDstandardNth1(&beta2[index]); - CCTK_REAL const PDstandardNth2beta2 = PDstandardNth2(&beta2[index]); - CCTK_REAL const PDstandardNth3beta2 = PDstandardNth3(&beta2[index]); - CCTK_REAL const PDstandardNth11beta2 = PDstandardNth11(&beta2[index]); - CCTK_REAL const PDstandardNth22beta2 = PDstandardNth22(&beta2[index]); - CCTK_REAL const PDstandardNth33beta2 = PDstandardNth33(&beta2[index]); - CCTK_REAL const PDstandardNth12beta2 = PDstandardNth12(&beta2[index]); - CCTK_REAL const PDstandardNth13beta2 = PDstandardNth13(&beta2[index]); - CCTK_REAL const PDstandardNth23beta2 = PDstandardNth23(&beta2[index]); - CCTK_REAL const PDstandardNth1beta3 = PDstandardNth1(&beta3[index]); - CCTK_REAL const PDstandardNth2beta3 = PDstandardNth2(&beta3[index]); - CCTK_REAL const PDstandardNth3beta3 = PDstandardNth3(&beta3[index]); - CCTK_REAL const PDstandardNth11beta3 = PDstandardNth11(&beta3[index]); - CCTK_REAL const PDstandardNth22beta3 = PDstandardNth22(&beta3[index]); - CCTK_REAL const PDstandardNth33beta3 = PDstandardNth33(&beta3[index]); - CCTK_REAL const PDstandardNth12beta3 = PDstandardNth12(&beta3[index]); - CCTK_REAL const PDstandardNth13beta3 = PDstandardNth13(&beta3[index]); - CCTK_REAL const PDstandardNth23beta3 = PDstandardNth23(&beta3[index]); - CCTK_REAL const PDstandardNth1gt11 = PDstandardNth1(>11[index]); - CCTK_REAL const PDstandardNth2gt11 = PDstandardNth2(>11[index]); - CCTK_REAL const PDstandardNth3gt11 = PDstandardNth3(>11[index]); - CCTK_REAL const PDstandardNth1gt12 = PDstandardNth1(>12[index]); - CCTK_REAL const PDstandardNth2gt12 = PDstandardNth2(>12[index]); - CCTK_REAL const PDstandardNth3gt12 = PDstandardNth3(>12[index]); - CCTK_REAL const PDstandardNth1gt13 = PDstandardNth1(>13[index]); - CCTK_REAL const PDstandardNth2gt13 = PDstandardNth2(>13[index]); - CCTK_REAL const PDstandardNth3gt13 = PDstandardNth3(>13[index]); - CCTK_REAL const PDstandardNth1gt22 = PDstandardNth1(>22[index]); - CCTK_REAL const PDstandardNth2gt22 = PDstandardNth2(>22[index]); - CCTK_REAL const PDstandardNth3gt22 = PDstandardNth3(>22[index]); - CCTK_REAL const PDstandardNth1gt23 = PDstandardNth1(>23[index]); - CCTK_REAL const PDstandardNth2gt23 = PDstandardNth2(>23[index]); - CCTK_REAL const PDstandardNth3gt23 = PDstandardNth3(>23[index]); - CCTK_REAL const PDstandardNth1gt33 = PDstandardNth1(>33[index]); - CCTK_REAL const PDstandardNth2gt33 = PDstandardNth2(>33[index]); - CCTK_REAL const PDstandardNth3gt33 = PDstandardNth3(>33[index]); - CCTK_REAL const PDstandardNth1phi = PDstandardNth1(&phi[index]); - CCTK_REAL const PDstandardNth2phi = PDstandardNth2(&phi[index]); - CCTK_REAL const PDstandardNth3phi = PDstandardNth3(&phi[index]); - CCTK_REAL const PDstandardNth1trK = PDstandardNth1(&trK[index]); - CCTK_REAL const PDstandardNth2trK = PDstandardNth2(&trK[index]); - CCTK_REAL const PDstandardNth3trK = PDstandardNth3(&trK[index]); + CCTK_REAL_VEC const PDstandardNth1alpha = PDstandardNth1(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth2alpha = PDstandardNth2(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth3alpha = PDstandardNth3(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth11alpha = PDstandardNth11(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth22alpha = PDstandardNth22(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth33alpha = PDstandardNth33(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth12alpha = PDstandardNth12(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth13alpha = PDstandardNth13(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth23alpha = PDstandardNth23(&alpha[index]); + CCTK_REAL_VEC const PDstandardNth1beta1 = PDstandardNth1(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth2beta1 = PDstandardNth2(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth3beta1 = PDstandardNth3(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth11beta1 = PDstandardNth11(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth22beta1 = PDstandardNth22(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth33beta1 = PDstandardNth33(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth12beta1 = PDstandardNth12(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth13beta1 = PDstandardNth13(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth23beta1 = PDstandardNth23(&beta1[index]); + CCTK_REAL_VEC const PDstandardNth1beta2 = PDstandardNth1(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth2beta2 = PDstandardNth2(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth3beta2 = PDstandardNth3(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth11beta2 = PDstandardNth11(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth22beta2 = PDstandardNth22(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth33beta2 = PDstandardNth33(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth12beta2 = PDstandardNth12(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth13beta2 = PDstandardNth13(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth23beta2 = PDstandardNth23(&beta2[index]); + CCTK_REAL_VEC const PDstandardNth1beta3 = PDstandardNth1(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth2beta3 = PDstandardNth2(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth3beta3 = PDstandardNth3(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth11beta3 = PDstandardNth11(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth22beta3 = PDstandardNth22(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth33beta3 = PDstandardNth33(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth12beta3 = PDstandardNth12(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth13beta3 = PDstandardNth13(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth23beta3 = PDstandardNth23(&beta3[index]); + CCTK_REAL_VEC const PDstandardNth1gt11 = PDstandardNth1(>11[index]); + CCTK_REAL_VEC const PDstandardNth2gt11 = PDstandardNth2(>11[index]); + CCTK_REAL_VEC const PDstandardNth3gt11 = PDstandardNth3(>11[index]); + CCTK_REAL_VEC const PDstandardNth1gt12 = PDstandardNth1(>12[index]); + CCTK_REAL_VEC const PDstandardNth2gt12 = PDstandardNth2(>12[index]); + CCTK_REAL_VEC const PDstandardNth3gt12 = PDstandardNth3(>12[index]); + CCTK_REAL_VEC const PDstandardNth1gt13 = PDstandardNth1(>13[index]); + CCTK_REAL_VEC const PDstandardNth2gt13 = PDstandardNth2(>13[index]); + CCTK_REAL_VEC const PDstandardNth3gt13 = PDstandardNth3(>13[index]); + CCTK_REAL_VEC const PDstandardNth1gt22 = PDstandardNth1(>22[index]); + CCTK_REAL_VEC const PDstandardNth2gt22 = PDstandardNth2(>22[index]); + CCTK_REAL_VEC const PDstandardNth3gt22 = PDstandardNth3(>22[index]); + CCTK_REAL_VEC const PDstandardNth1gt23 = PDstandardNth1(>23[index]); + CCTK_REAL_VEC const PDstandardNth2gt23 = PDstandardNth2(>23[index]); + CCTK_REAL_VEC const PDstandardNth3gt23 = PDstandardNth3(>23[index]); + CCTK_REAL_VEC const PDstandardNth1gt33 = PDstandardNth1(>33[index]); + CCTK_REAL_VEC const PDstandardNth2gt33 = PDstandardNth2(>33[index]); + CCTK_REAL_VEC const PDstandardNth3gt33 = PDstandardNth3(>33[index]); + CCTK_REAL_VEC const PDstandardNth1phi = PDstandardNth1(&phi[index]); + CCTK_REAL_VEC const PDstandardNth2phi = PDstandardNth2(&phi[index]); + CCTK_REAL_VEC const PDstandardNth3phi = PDstandardNth3(&phi[index]); + CCTK_REAL_VEC const PDstandardNth1trK = PDstandardNth1(&trK[index]); + CCTK_REAL_VEC const PDstandardNth2trK = PDstandardNth2(&trK[index]); + CCTK_REAL_VEC const PDstandardNth3trK = PDstandardNth3(&trK[index]); /* Calculate temporaries and grid functions */ ptrdiff_t dir1 = Sign(beta1L); @@ -259,340 +261,383 @@ static void ML_BSSN_RHS1_Body(cGH const * restrict const cctkGH, int const dir, ptrdiff_t dir3 = Sign(beta3L); - CCTK_REAL detgt = 1; + CCTK_REAL_VEC detgt = ToReal(1); - CCTK_REAL gtu11 = INV(detgt)*(gt22L*gt33L - SQR(gt23L)); + CCTK_REAL_VEC gtu11 = kmul(INV(detgt),kmsub(gt22L,gt33L,SQR(gt23L))); - CCTK_REAL gtu12 = (gt13L*gt23L - gt12L*gt33L)*INV(detgt); + CCTK_REAL_VEC gtu12 = + kmul(INV(detgt),kmsub(gt13L,gt23L,kmul(gt12L,gt33L))); - CCTK_REAL gtu13 = (-(gt13L*gt22L) + gt12L*gt23L)*INV(detgt); + CCTK_REAL_VEC gtu13 = + kmul(INV(detgt),kmsub(gt12L,gt23L,kmul(gt13L,gt22L))); - CCTK_REAL gtu22 = INV(detgt)*(gt11L*gt33L - SQR(gt13L)); + CCTK_REAL_VEC gtu22 = kmul(INV(detgt),kmsub(gt11L,gt33L,SQR(gt13L))); - CCTK_REAL gtu23 = (gt12L*gt13L - gt11L*gt23L)*INV(detgt); + CCTK_REAL_VEC gtu23 = + kmul(INV(detgt),kmsub(gt12L,gt13L,kmul(gt11L,gt23L))); - CCTK_REAL gtu33 = INV(detgt)*(gt11L*gt22L - SQR(gt12L)); + CCTK_REAL_VEC gtu33 = kmul(INV(detgt),kmsub(gt11L,gt22L,SQR(gt12L))); - CCTK_REAL Gtl111 = 0.5*PDstandardNth1gt11; + CCTK_REAL_VEC Gtl111 = kmul(PDstandardNth1gt11,ToReal(0.5)); - CCTK_REAL Gtl112 = 0.5*PDstandardNth2gt11; + CCTK_REAL_VEC Gtl112 = kmul(PDstandardNth2gt11,ToReal(0.5)); - CCTK_REAL Gtl113 = 0.5*PDstandardNth3gt11; + CCTK_REAL_VEC Gtl113 = kmul(PDstandardNth3gt11,ToReal(0.5)); - CCTK_REAL Gtl122 = -0.5*PDstandardNth1gt22 + PDstandardNth2gt12; + CCTK_REAL_VEC Gtl122 = + kmadd(PDstandardNth1gt22,ToReal(-0.5),PDstandardNth2gt12); - CCTK_REAL Gtl123 = 0.5*(-PDstandardNth1gt23 + PDstandardNth2gt13 + - PDstandardNth3gt12); + CCTK_REAL_VEC Gtl123 = + kmul(kadd(PDstandardNth2gt13,ksub(PDstandardNth3gt12,PDstandardNth1gt23)),ToReal(0.5)); - CCTK_REAL Gtl133 = -0.5*PDstandardNth1gt33 + PDstandardNth3gt13; + CCTK_REAL_VEC Gtl133 = + kmadd(PDstandardNth1gt33,ToReal(-0.5),PDstandardNth3gt13); - CCTK_REAL Gtl211 = PDstandardNth1gt12 - 0.5*PDstandardNth2gt11; + CCTK_REAL_VEC Gtl211 = + kmadd(PDstandardNth2gt11,ToReal(-0.5),PDstandardNth1gt12); - CCTK_REAL Gtl212 = 0.5*PDstandardNth1gt22; + CCTK_REAL_VEC Gtl212 = kmul(PDstandardNth1gt22,ToReal(0.5)); - CCTK_REAL Gtl213 = 0.5*(PDstandardNth1gt23 - PDstandardNth2gt13 + - PDstandardNth3gt12); + CCTK_REAL_VEC Gtl213 = + kmul(kadd(PDstandardNth1gt23,ksub(PDstandardNth3gt12,PDstandardNth2gt13)),ToReal(0.5)); - CCTK_REAL Gtl222 = 0.5*PDstandardNth2gt22; + CCTK_REAL_VEC Gtl222 = kmul(PDstandardNth2gt22,ToReal(0.5)); - CCTK_REAL Gtl223 = 0.5*PDstandardNth3gt22; + CCTK_REAL_VEC Gtl223 = kmul(PDstandardNth3gt22,ToReal(0.5)); - CCTK_REAL Gtl233 = -0.5*PDstandardNth2gt33 + PDstandardNth3gt23; + CCTK_REAL_VEC Gtl233 = + kmadd(PDstandardNth2gt33,ToReal(-0.5),PDstandardNth3gt23); - CCTK_REAL Gtl311 = PDstandardNth1gt13 - 0.5*PDstandardNth3gt11; + CCTK_REAL_VEC Gtl311 = + kmadd(PDstandardNth3gt11,ToReal(-0.5),PDstandardNth1gt13); - CCTK_REAL Gtl312 = 0.5*(PDstandardNth1gt23 + PDstandardNth2gt13 - - PDstandardNth3gt12); + CCTK_REAL_VEC Gtl312 = + kmul(kadd(PDstandardNth1gt23,ksub(PDstandardNth2gt13,PDstandardNth3gt12)),ToReal(0.5)); - CCTK_REAL Gtl313 = 0.5*PDstandardNth1gt33; + CCTK_REAL_VEC Gtl313 = kmul(PDstandardNth1gt33,ToReal(0.5)); - CCTK_REAL Gtl322 = PDstandardNth2gt23 - 0.5*PDstandardNth3gt22; + CCTK_REAL_VEC Gtl322 = + kmadd(PDstandardNth3gt22,ToReal(-0.5),PDstandardNth2gt23); - CCTK_REAL Gtl323 = 0.5*PDstandardNth2gt33; + CCTK_REAL_VEC Gtl323 = kmul(PDstandardNth2gt33,ToReal(0.5)); - CCTK_REAL Gtl333 = 0.5*PDstandardNth3gt33; + CCTK_REAL_VEC Gtl333 = kmul(PDstandardNth3gt33,ToReal(0.5)); - CCTK_REAL Gt111 = Gtl111*gtu11 + Gtl211*gtu12 + Gtl311*gtu13; + CCTK_REAL_VEC Gt111 = + kmadd(Gtl111,gtu11,kmadd(Gtl211,gtu12,kmul(Gtl311,gtu13))); - CCTK_REAL Gt211 = Gtl111*gtu12 + Gtl211*gtu22 + Gtl311*gtu23; + CCTK_REAL_VEC Gt211 = + kmadd(Gtl111,gtu12,kmadd(Gtl211,gtu22,kmul(Gtl311,gtu23))); - CCTK_REAL Gt311 = Gtl111*gtu13 + Gtl211*gtu23 + Gtl311*gtu33; + CCTK_REAL_VEC Gt311 = + kmadd(Gtl111,gtu13,kmadd(Gtl211,gtu23,kmul(Gtl311,gtu33))); - CCTK_REAL Gt112 = Gtl112*gtu11 + Gtl212*gtu12 + Gtl312*gtu13; + CCTK_REAL_VEC Gt112 = + kmadd(Gtl112,gtu11,kmadd(Gtl212,gtu12,kmul(Gtl312,gtu13))); - CCTK_REAL Gt212 = Gtl112*gtu12 + Gtl212*gtu22 + Gtl312*gtu23; + CCTK_REAL_VEC Gt212 = + kmadd(Gtl112,gtu12,kmadd(Gtl212,gtu22,kmul(Gtl312,gtu23))); - CCTK_REAL Gt312 = Gtl112*gtu13 + Gtl212*gtu23 + Gtl312*gtu33; + CCTK_REAL_VEC Gt312 = + kmadd(Gtl112,gtu13,kmadd(Gtl212,gtu23,kmul(Gtl312,gtu33))); - CCTK_REAL Gt113 = Gtl113*gtu11 + Gtl213*gtu12 + Gtl313*gtu13; + CCTK_REAL_VEC Gt113 = + kmadd(Gtl113,gtu11,kmadd(Gtl213,gtu12,kmul(Gtl313,gtu13))); - CCTK_REAL Gt213 = Gtl113*gtu12 + Gtl213*gtu22 + Gtl313*gtu23; + CCTK_REAL_VEC Gt213 = + kmadd(Gtl113,gtu12,kmadd(Gtl213,gtu22,kmul(Gtl313,gtu23))); - CCTK_REAL Gt313 = Gtl113*gtu13 + Gtl213*gtu23 + Gtl313*gtu33; + CCTK_REAL_VEC Gt313 = + kmadd(Gtl113,gtu13,kmadd(Gtl213,gtu23,kmul(Gtl313,gtu33))); - CCTK_REAL Gt122 = Gtl122*gtu11 + Gtl222*gtu12 + Gtl322*gtu13; + CCTK_REAL_VEC Gt122 = + kmadd(Gtl122,gtu11,kmadd(Gtl222,gtu12,kmul(Gtl322,gtu13))); - CCTK_REAL Gt222 = Gtl122*gtu12 + Gtl222*gtu22 + Gtl322*gtu23; + CCTK_REAL_VEC Gt222 = + kmadd(Gtl122,gtu12,kmadd(Gtl222,gtu22,kmul(Gtl322,gtu23))); - CCTK_REAL Gt322 = Gtl122*gtu13 + Gtl222*gtu23 + Gtl322*gtu33; + CCTK_REAL_VEC Gt322 = + kmadd(Gtl122,gtu13,kmadd(Gtl222,gtu23,kmul(Gtl322,gtu33))); - CCTK_REAL Gt123 = Gtl123*gtu11 + Gtl223*gtu12 + Gtl323*gtu13; + CCTK_REAL_VEC Gt123 = + kmadd(Gtl123,gtu11,kmadd(Gtl223,gtu12,kmul(Gtl323,gtu13))); - CCTK_REAL Gt223 = Gtl123*gtu12 + Gtl223*gtu22 + Gtl323*gtu23; + CCTK_REAL_VEC Gt223 = + kmadd(Gtl123,gtu12,kmadd(Gtl223,gtu22,kmul(Gtl323,gtu23))); - CCTK_REAL Gt323 = Gtl123*gtu13 + Gtl223*gtu23 + Gtl323*gtu33; + CCTK_REAL_VEC Gt323 = + kmadd(Gtl123,gtu13,kmadd(Gtl223,gtu23,kmul(Gtl323,gtu33))); - CCTK_REAL Gt133 = Gtl133*gtu11 + Gtl233*gtu12 + Gtl333*gtu13; + CCTK_REAL_VEC Gt133 = + kmadd(Gtl133,gtu11,kmadd(Gtl233,gtu12,kmul(Gtl333,gtu13))); - CCTK_REAL Gt233 = Gtl133*gtu12 + Gtl233*gtu22 + Gtl333*gtu23; + CCTK_REAL_VEC Gt233 = + kmadd(Gtl133,gtu12,kmadd(Gtl233,gtu22,kmul(Gtl333,gtu23))); - CCTK_REAL Gt333 = Gtl133*gtu13 + Gtl233*gtu23 + Gtl333*gtu33; + CCTK_REAL_VEC Gt333 = + kmadd(Gtl133,gtu13,kmadd(Gtl233,gtu23,kmul(Gtl333,gtu33))); - CCTK_REAL Xtn1 = Gt111*gtu11 + Gt122*gtu22 + 2*(Gt112*gtu12 + - Gt113*gtu13 + Gt123*gtu23) + Gt133*gtu33; + CCTK_REAL_VEC Xtn1 = + kmadd(Gt111,gtu11,kmadd(Gt122,gtu22,kmadd(Gt133,gtu33,kmul(kmadd(Gt112,gtu12,kmadd(Gt113,gtu13,kmul(Gt123,gtu23))),ToReal(2))))); - CCTK_REAL Xtn2 = Gt211*gtu11 + Gt222*gtu22 + 2*(Gt212*gtu12 + - Gt213*gtu13 + Gt223*gtu23) + Gt233*gtu33; + CCTK_REAL_VEC Xtn2 = + kmadd(Gt211,gtu11,kmadd(Gt222,gtu22,kmadd(Gt233,gtu33,kmul(kmadd(Gt212,gtu12,kmadd(Gt213,gtu13,kmul(Gt223,gtu23))),ToReal(2))))); - CCTK_REAL Xtn3 = Gt311*gtu11 + Gt322*gtu22 + 2*(Gt312*gtu12 + - Gt313*gtu13 + Gt323*gtu23) + Gt333*gtu33; + CCTK_REAL_VEC Xtn3 = + kmadd(Gt311,gtu11,kmadd(Gt322,gtu22,kmadd(Gt333,gtu33,kmul(kmadd(Gt312,gtu12,kmadd(Gt313,gtu13,kmul(Gt323,gtu23))),ToReal(2))))); - CCTK_REAL fac1 = IfThen(conformalMethod,-0.5*INV(phiL),1); + CCTK_REAL_VEC fac1 = + IfThen(conformalMethod,kmul(INV(phiL),ToReal(-0.5)),ToReal(1)); - CCTK_REAL cdphi1 = fac1*PDstandardNth1phi; + CCTK_REAL_VEC cdphi1 = kmul(fac1,PDstandardNth1phi); - CCTK_REAL cdphi2 = fac1*PDstandardNth2phi; + CCTK_REAL_VEC cdphi2 = kmul(fac1,PDstandardNth2phi); - CCTK_REAL cdphi3 = fac1*PDstandardNth3phi; + CCTK_REAL_VEC cdphi3 = kmul(fac1,PDstandardNth3phi); - CCTK_REAL Atm11 = At11L*gtu11 + At12L*gtu12 + At13L*gtu13; + CCTK_REAL_VEC Atm11 = + kmadd(At11L,gtu11,kmadd(At12L,gtu12,kmul(At13L,gtu13))); - CCTK_REAL Atm21 = At11L*gtu12 + At12L*gtu22 + At13L*gtu23; + CCTK_REAL_VEC Atm21 = + kmadd(At11L,gtu12,kmadd(At12L,gtu22,kmul(At13L,gtu23))); - CCTK_REAL Atm31 = At11L*gtu13 + At12L*gtu23 + At13L*gtu33; + CCTK_REAL_VEC Atm31 = + kmadd(At11L,gtu13,kmadd(At12L,gtu23,kmul(At13L,gtu33))); - CCTK_REAL Atm12 = At12L*gtu11 + At22L*gtu12 + At23L*gtu13; + CCTK_REAL_VEC Atm12 = + kmadd(At12L,gtu11,kmadd(At22L,gtu12,kmul(At23L,gtu13))); - CCTK_REAL Atm22 = At12L*gtu12 + At22L*gtu22 + At23L*gtu23; + CCTK_REAL_VEC Atm22 = + kmadd(At12L,gtu12,kmadd(At22L,gtu22,kmul(At23L,gtu23))); - CCTK_REAL Atm32 = At12L*gtu13 + At22L*gtu23 + At23L*gtu33; + CCTK_REAL_VEC Atm32 = + kmadd(At12L,gtu13,kmadd(At22L,gtu23,kmul(At23L,gtu33))); - CCTK_REAL Atm13 = At13L*gtu11 + At23L*gtu12 + At33L*gtu13; + CCTK_REAL_VEC Atm13 = + kmadd(At13L,gtu11,kmadd(At23L,gtu12,kmul(At33L,gtu13))); - CCTK_REAL Atm23 = At13L*gtu12 + At23L*gtu22 + At33L*gtu23; + CCTK_REAL_VEC Atm23 = + kmadd(At13L,gtu12,kmadd(At23L,gtu22,kmul(At33L,gtu23))); - CCTK_REAL Atm33 = At13L*gtu13 + At23L*gtu23 + At33L*gtu33; + CCTK_REAL_VEC Atm33 = + kmadd(At13L,gtu13,kmadd(At23L,gtu23,kmul(At33L,gtu33))); - CCTK_REAL Atu11 = Atm11*gtu11 + Atm12*gtu12 + Atm13*gtu13; + CCTK_REAL_VEC Atu11 = + kmadd(Atm11,gtu11,kmadd(Atm12,gtu12,kmul(Atm13,gtu13))); - CCTK_REAL Atu12 = Atm11*gtu12 + Atm12*gtu22 + Atm13*gtu23; + CCTK_REAL_VEC Atu12 = + kmadd(Atm11,gtu12,kmadd(Atm12,gtu22,kmul(Atm13,gtu23))); - CCTK_REAL Atu13 = Atm11*gtu13 + Atm12*gtu23 + Atm13*gtu33; + CCTK_REAL_VEC Atu13 = + kmadd(Atm11,gtu13,kmadd(Atm12,gtu23,kmul(Atm13,gtu33))); - CCTK_REAL Atu22 = Atm21*gtu12 + Atm22*gtu22 + Atm23*gtu23; + CCTK_REAL_VEC Atu22 = + kmadd(Atm21,gtu12,kmadd(Atm22,gtu22,kmul(Atm23,gtu23))); - CCTK_REAL Atu23 = Atm21*gtu13 + Atm22*gtu23 + Atm23*gtu33; + CCTK_REAL_VEC Atu23 = + kmadd(Atm21,gtu13,kmadd(Atm22,gtu23,kmul(Atm23,gtu33))); - CCTK_REAL Atu33 = Atm31*gtu13 + Atm32*gtu23 + Atm33*gtu33; + CCTK_REAL_VEC Atu33 = + kmadd(Atm31,gtu13,kmadd(Atm32,gtu23,kmul(Atm33,gtu33))); - CCTK_REAL e4phi = IfThen(conformalMethod,INV(SQR(phiL)),exp(4*phiL)); + CCTK_REAL_VEC e4phi = + IfThen(conformalMethod,INV(SQR(phiL)),kexp(kmul(phiL,ToReal(4)))); - CCTK_REAL em4phi = INV(e4phi); + CCTK_REAL_VEC em4phi = INV(e4phi); - CCTK_REAL rho = INV(SQR(alphaL))*(eTttL - 2*(beta2L*eTtyL + - beta3L*eTtzL) + 2*(beta1L*(-eTtxL + beta2L*eTxyL + beta3L*eTxzL) + - beta2L*beta3L*eTyzL) + eTxxL*SQR(beta1L) + eTyyL*SQR(beta2L) + - eTzzL*SQR(beta3L)); + CCTK_REAL_VEC rho = + kmul(INV(SQR(alphaL)),kadd(eTttL,kmadd(eTxxL,SQR(beta1L),kmadd(eTyyL,SQR(beta2L),kmadd(eTzzL,SQR(beta3L),kmadd(kmadd(beta2L,eTtyL,kmul(beta3L,eTtzL)),ToReal(-2),kmul(kmadd(beta2L,kmul(beta3L,eTyzL),kmul(beta1L,kmadd(beta2L,eTxyL,kmsub(beta3L,eTxzL,eTtxL)))),ToReal(2)))))))); - CCTK_REAL S1 = (-eTtxL + beta1L*eTxxL + beta2L*eTxyL + - beta3L*eTxzL)*INV(alphaL); + CCTK_REAL_VEC S1 = + kmul(INV(alphaL),kmadd(beta1L,eTxxL,kmadd(beta2L,eTxyL,kmsub(beta3L,eTxzL,eTtxL)))); - CCTK_REAL S2 = (-eTtyL + beta1L*eTxyL + beta2L*eTyyL + - beta3L*eTyzL)*INV(alphaL); + CCTK_REAL_VEC S2 = + kmul(INV(alphaL),kmadd(beta1L,eTxyL,kmadd(beta2L,eTyyL,kmsub(beta3L,eTyzL,eTtyL)))); - CCTK_REAL S3 = (-eTtzL + beta1L*eTxzL + beta2L*eTyzL + - beta3L*eTzzL)*INV(alphaL); + CCTK_REAL_VEC S3 = + kmul(INV(alphaL),kmadd(beta1L,eTxzL,kmadd(beta2L,eTyzL,kmsub(beta3L,eTzzL,eTtzL)))); - CCTK_REAL trS = em4phi*(eTxxL*gtu11 + eTyyL*gtu22 + 2*(eTxyL*gtu12 + - eTxzL*gtu13 + eTyzL*gtu23) + eTzzL*gtu33); + CCTK_REAL_VEC trS = + kmul(em4phi,kmadd(eTxxL,gtu11,kmadd(eTyyL,gtu22,kmadd(eTzzL,gtu33,kmul(kmadd(eTxyL,gtu12,kmadd(eTxzL,gtu13,kmul(eTyzL,gtu23))),ToReal(2)))))); - CCTK_REAL phirhsL = - IfThen(conformalMethod,phiL*(-0.333333333333333333333333333333*(PDstandardNth1beta1 - + PDstandardNth2beta2 + PDstandardNth3beta3) + - 0.333333333333333333333333333333*alphaL*trKL),0.166666666666666666666666666667*(PDstandardNth1beta1 - + PDstandardNth2beta2 + PDstandardNth3beta3) - - 0.166666666666666666666666666667*alphaL*trKL); + CCTK_REAL_VEC phirhsL = + IfThen(conformalMethod,kmul(phiL,kmadd(kadd(PDstandardNth1beta1,kadd(PDstandardNth2beta2,PDstandardNth3beta3)),ToReal(-0.333333333333333333333333333333),kmul(alphaL,kmul(trKL,ToReal(0.333333333333333333333333333333))))),kmadd(alphaL,kmul(trKL,ToReal(-0.166666666666666666666666666667)),kmul(kadd(PDstandardNth1beta1,kadd(PDstandardNth2beta2,PDstandardNth3beta3)),ToReal(0.166666666666666666666666666667)))); - CCTK_REAL gt11rhsL = -0.666666666666666666666666666667*(3*alphaL*At11L - - 3*(gt12L*PDstandardNth1beta2 + gt13L*PDstandardNth1beta3) + - gt11L*(-2*PDstandardNth1beta1 + PDstandardNth2beta2 + - PDstandardNth3beta3)); + CCTK_REAL_VEC gt11rhsL = + kmul(ToReal(-0.666666666666666666666666666667),kmadd(kmadd(gt12L,PDstandardNth1beta2,kmul(gt13L,PDstandardNth1beta3)),ToReal(-3),kmadd(gt11L,kadd(PDstandardNth2beta2,kmadd(PDstandardNth1beta1,ToReal(-2),PDstandardNth3beta3)),kmul(alphaL,kmul(At11L,ToReal(3)))))); - CCTK_REAL gt12rhsL = 0.333333333333333333333333333333*(-6*alphaL*At12L - + 3*(gt22L*PDstandardNth1beta2 + gt23L*PDstandardNth1beta3 + - gt11L*PDstandardNth2beta1 + gt13L*PDstandardNth2beta3) + - gt12L*(PDstandardNth1beta1 + PDstandardNth2beta2 - - 2*PDstandardNth3beta3)); + CCTK_REAL_VEC gt12rhsL = + kmul(ToReal(0.333333333333333333333333333333),kmadd(alphaL,kmul(At12L,ToReal(-6)),kmadd(gt12L,kadd(PDstandardNth1beta1,kmadd(PDstandardNth3beta3,ToReal(-2),PDstandardNth2beta2)),kmul(kmadd(gt22L,PDstandardNth1beta2,kmadd(gt23L,PDstandardNth1beta3,kmadd(gt11L,PDstandardNth2beta1,kmul(gt13L,PDstandardNth2beta3)))),ToReal(3))))); - CCTK_REAL gt13rhsL = 0.333333333333333333333333333333*(-6*alphaL*At13L - + 3*(gt23L*PDstandardNth1beta2 + gt33L*PDstandardNth1beta3 + - gt11L*PDstandardNth3beta1 + gt12L*PDstandardNth3beta2) + - gt13L*(PDstandardNth1beta1 - 2*PDstandardNth2beta2 + - PDstandardNth3beta3)); - - CCTK_REAL gt22rhsL = -0.666666666666666666666666666667*(3*alphaL*At22L - - 3*(gt12L*PDstandardNth2beta1 + gt23L*PDstandardNth2beta3) + - gt22L*(PDstandardNth1beta1 - 2*PDstandardNth2beta2 + - PDstandardNth3beta3)); - - CCTK_REAL gt23rhsL = 0.333333333333333333333333333333*(-6*alphaL*At23L - + 3*(gt13L*PDstandardNth2beta1 + gt33L*PDstandardNth2beta3 + - gt12L*PDstandardNth3beta1 + gt22L*PDstandardNth3beta2) + - gt23L*(-2*PDstandardNth1beta1 + PDstandardNth2beta2 + - PDstandardNth3beta3)); - - CCTK_REAL gt33rhsL = -0.666666666666666666666666666667*(3*alphaL*At33L - - 3*(gt13L*PDstandardNth3beta1 + gt23L*PDstandardNth3beta2) + - gt33L*(PDstandardNth1beta1 + PDstandardNth2beta2 - - 2*PDstandardNth3beta3)); - - CCTK_REAL dotXt1 = - 0.333333333333333333333333333333*(7*(gtu12*PDstandardNth12beta1 + - gtu13*PDstandardNth13beta1) + 6*gtu23*PDstandardNth23beta1 + - 3*(gtu22*PDstandardNth22beta1 + gtu33*PDstandardNth33beta1) - - 6*(Atu11*PDstandardNth1alpha + Atu12*PDstandardNth2alpha + - Atu13*PDstandardNth3alpha) + gtu11*(4*PDstandardNth11beta1 + - PDstandardNth12beta2 + PDstandardNth13beta3 - - 150.7964473723100754462068823974161384415*alphaL*S1) + - gtu12*(PDstandardNth22beta2 + PDstandardNth23beta3 - - 150.7964473723100754462068823974161384415*alphaL*S2) + - gtu13*(PDstandardNth23beta2 + PDstandardNth33beta3 - - 150.7964473723100754462068823974161384415*alphaL*S3) + - (-PDstandardNth1beta1 + 2*PDstandardNth3beta3)*Xtn1 + - 2*(alphaL*(18*(Atu11*cdphi1 + Atu12*cdphi2 + Atu13*cdphi3) + - 6*(Atu12*Gt112 + Atu13*Gt113 + Atu23*Gt123) + 3*(Atu11*Gt111 + - Atu22*Gt122 + Atu33*Gt133) - 2*(gtu11*PDstandardNth1trK + - gtu12*PDstandardNth2trK + gtu13*PDstandardNth3trK)) + - PDstandardNth2beta2*Xtn1) - 3*(PDstandardNth2beta1*Xtn2 + - PDstandardNth3beta1*Xtn3)); - - CCTK_REAL dotXt2 = - 0.333333333333333333333333333333*(6*gtu13*PDstandardNth13beta2 + - 3*(gtu11*PDstandardNth11beta2 + gtu33*PDstandardNth33beta2) - - 6*(Atu12*PDstandardNth1alpha + Atu22*PDstandardNth2alpha + - Atu23*PDstandardNth3alpha) + gtu12*(PDstandardNth11beta1 + - 7*PDstandardNth12beta2 + PDstandardNth13beta3 - - 150.7964473723100754462068823974161384415*alphaL*S1) + - gtu22*(PDstandardNth12beta1 + 4*PDstandardNth22beta2 + - PDstandardNth23beta3 - - 150.7964473723100754462068823974161384415*alphaL*S2) + - gtu23*(PDstandardNth13beta1 + 7*PDstandardNth23beta2 + - PDstandardNth33beta3 - - 150.7964473723100754462068823974161384415*alphaL*S3) + - (-PDstandardNth2beta2 + 2*PDstandardNth3beta3)*Xtn2 + - 2*(alphaL*(18*(Atu12*cdphi1 + Atu22*cdphi2 + Atu23*cdphi3) + - 6*(Atu12*Gt212 + Atu13*Gt213 + Atu23*Gt223) + 3*(Atu11*Gt211 + - Atu22*Gt222 + Atu33*Gt233) - 2*(gtu12*PDstandardNth1trK + - gtu22*PDstandardNth2trK + gtu23*PDstandardNth3trK)) + - PDstandardNth1beta1*Xtn2) - 3*(PDstandardNth1beta2*Xtn1 + - PDstandardNth3beta2*Xtn3)); - - CCTK_REAL dotXt3 = - 0.333333333333333333333333333333*(6*gtu12*PDstandardNth12beta3 + - 3*(gtu11*PDstandardNth11beta3 + gtu22*PDstandardNth22beta3) - - 6*(Atu13*PDstandardNth1alpha + Atu23*PDstandardNth2alpha + - Atu33*PDstandardNth3alpha) + gtu13*(PDstandardNth11beta1 + - PDstandardNth12beta2 + 7*PDstandardNth13beta3 - - 150.7964473723100754462068823974161384415*alphaL*S1) + - gtu23*(PDstandardNth12beta1 + PDstandardNth22beta2 + - 7*PDstandardNth23beta3 - - 150.7964473723100754462068823974161384415*alphaL*S2) + - gtu33*(PDstandardNth13beta1 + PDstandardNth23beta2 + - 4*PDstandardNth33beta3 - - 150.7964473723100754462068823974161384415*alphaL*S3) - - 3*(PDstandardNth1beta3*Xtn1 + PDstandardNth2beta3*Xtn2) + - (2*PDstandardNth2beta2 - PDstandardNth3beta3)*Xtn3 + - 2*(alphaL*(18*(Atu13*cdphi1 + Atu23*cdphi2 + Atu33*cdphi3) + - 6*(Atu12*Gt312 + Atu13*Gt313 + Atu23*Gt323) + 3*(Atu11*Gt311 + - Atu22*Gt322 + Atu33*Gt333) - 2*(gtu13*PDstandardNth1trK + - gtu23*PDstandardNth2trK + gtu33*PDstandardNth3trK)) + - PDstandardNth1beta1*Xtn3)); - - CCTK_REAL Xt1rhsL = dotXt1; - - CCTK_REAL Xt2rhsL = dotXt2; - - CCTK_REAL Xt3rhsL = dotXt3; - - CCTK_REAL dottrK = -(em4phi*(gtu11*PDstandardNth11alpha + - gtu22*PDstandardNth22alpha + gtu33*(PDstandardNth33alpha + - 2*cdphi3*PDstandardNth3alpha) + 2*(gtu12*PDstandardNth12alpha + - gtu13*(PDstandardNth13alpha + cdphi1*PDstandardNth3alpha) + - gtu23*(PDstandardNth23alpha + cdphi2*PDstandardNth3alpha)) + - PDstandardNth1alpha*(2*(cdphi1*gtu11 + cdphi2*gtu12 + cdphi3*gtu13) - - Xtn1) + PDstandardNth2alpha*(2*(cdphi1*gtu12 + cdphi2*gtu22 + - cdphi3*gtu23) - Xtn2) - PDstandardNth3alpha*Xtn3)) + - alphaL*(2*(Atm12*Atm21 + Atm13*Atm31 + Atm23*Atm32) + - 12.56637061435917295385057353311801153679*(rho + trS) + SQR(Atm11) + - SQR(Atm22) + SQR(Atm33) + 0.333333333333333333333333333333*SQR(trKL)); - - CCTK_REAL trKrhsL = dottrK; - - CCTK_REAL alpharhsL = - -(pow(alphaL,ToReal(harmonicN))*ToReal(harmonicF)*(trKL + (AL - - trKL)*ToReal(LapseACoeff))); - - CCTK_REAL ArhsL = (dottrK - - AL*ToReal(AlphaDriver))*ToReal(LapseACoeff); - - CCTK_REAL eta = fmin(1,INV(rL)*ToReal(SpatialBetaDriverRadius)); - - CCTK_REAL theta = fmin(1,exp(1 - - rL*INV(ToReal(SpatialShiftGammaCoeffRadius)))); - - CCTK_REAL beta1rhsL = theta*(Xt1L + beta1L*eta*ToReal(BetaDriver)*(-1 - + ToReal(ShiftBCoeff)) + (B1L - - Xt1L)*ToReal(ShiftBCoeff))*ToReal(ShiftGammaCoeff); - - CCTK_REAL beta2rhsL = theta*(Xt2L + beta2L*eta*ToReal(BetaDriver)*(-1 - + ToReal(ShiftBCoeff)) + (B2L - - Xt2L)*ToReal(ShiftBCoeff))*ToReal(ShiftGammaCoeff); - - CCTK_REAL beta3rhsL = theta*(Xt3L + beta3L*eta*ToReal(BetaDriver)*(-1 - + ToReal(ShiftBCoeff)) + (B3L - - Xt3L)*ToReal(ShiftBCoeff))*ToReal(ShiftGammaCoeff); - - CCTK_REAL B1rhsL = (dotXt1 - - B1L*eta*ToReal(BetaDriver))*ToReal(ShiftBCoeff); - - CCTK_REAL B2rhsL = (dotXt2 - - B2L*eta*ToReal(BetaDriver))*ToReal(ShiftBCoeff); - - CCTK_REAL B3rhsL = (dotXt3 - - B3L*eta*ToReal(BetaDriver))*ToReal(ShiftBCoeff); + CCTK_REAL_VEC gt13rhsL = + kmul(ToReal(0.333333333333333333333333333333),kmadd(alphaL,kmul(At13L,ToReal(-6)),kmadd(gt13L,kadd(PDstandardNth1beta1,kmadd(PDstandardNth2beta2,ToReal(-2),PDstandardNth3beta3)),kmul(kmadd(gt23L,PDstandardNth1beta2,kmadd(gt33L,PDstandardNth1beta3,kmadd(gt11L,PDstandardNth3beta1,kmul(gt12L,PDstandardNth3beta2)))),ToReal(3))))); + + CCTK_REAL_VEC gt22rhsL = + kmul(ToReal(-0.666666666666666666666666666667),kmadd(kmadd(gt12L,PDstandardNth2beta1,kmul(gt23L,PDstandardNth2beta3)),ToReal(-3),kmadd(gt22L,kadd(PDstandardNth1beta1,kmadd(PDstandardNth2beta2,ToReal(-2),PDstandardNth3beta3)),kmul(alphaL,kmul(At22L,ToReal(3)))))); + + CCTK_REAL_VEC gt23rhsL = + kmul(ToReal(0.333333333333333333333333333333),kmadd(alphaL,kmul(At23L,ToReal(-6)),kmadd(gt23L,kadd(PDstandardNth2beta2,kmadd(PDstandardNth1beta1,ToReal(-2),PDstandardNth3beta3)),kmul(kmadd(gt13L,PDstandardNth2beta1,kmadd(gt33L,PDstandardNth2beta3,kmadd(gt12L,PDstandardNth3beta1,kmul(gt22L,PDstandardNth3beta2)))),ToReal(3))))); + + CCTK_REAL_VEC gt33rhsL = + kmul(ToReal(-0.666666666666666666666666666667),kmadd(kmadd(gt13L,PDstandardNth3beta1,kmul(gt23L,PDstandardNth3beta2)),ToReal(-3),kmadd(gt33L,kadd(PDstandardNth1beta1,kmadd(PDstandardNth3beta3,ToReal(-2),PDstandardNth2beta2)),kmul(alphaL,kmul(At33L,ToReal(3)))))); + + CCTK_REAL_VEC dotXt1 = + kmul(ToReal(0.333333333333333333333333333333),kmadd(gtu12,kadd(PDstandardNth22beta2,kmadd(alphaL,kmul(S2,ToReal(-150.7964473723100754462068823974161384415)),PDstandardNth23beta3)),kmadd(gtu13,kadd(PDstandardNth23beta2,kmadd(alphaL,kmul(S3,ToReal(-150.7964473723100754462068823974161384415)),PDstandardNth33beta3)),kmadd(kmadd(Atu11,PDstandardNth1alpha,kmadd(Atu12,PDstandardNth2alpha,kmul(Atu13,PDstandardNth3alpha))),ToReal(-6),kmadd(kmadd(PDstandardNth2beta1,Xtn2,kmul(PDstandardNth3beta1,Xtn3)),ToReal(-3),kmadd(Xtn1,kmsub(PDstandardNth3beta3,ToReal(2),PDstandardNth1beta1),kmadd(kmadd(gtu22,PDstandardNth22beta1,kmul(gtu33,PDstandardNth33beta1)),ToReal(3),kmadd(gtu11,kadd(PDstandardNth12beta2,kadd(PDstandardNth13beta3,kmadd(alphaL,kmul(S1,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth11beta1,ToReal(4))))),kmadd(gtu23,kmul(PDstandardNth23beta1,ToReal(6)),kmadd(kmadd(gtu12,PDstandardNth12beta1,kmul(gtu13,PDstandardNth13beta1)),ToReal(7),kmul(ToReal(2),kmadd(PDstandardNth2beta2,Xtn1,kmul(alphaL,kmadd(kmadd(gtu11,PDstandardNth1trK,kmadd(gtu12,PDstandardNth2trK,kmul(gtu13,PDstandardNth3trK))),ToReal(-2),kmadd(kmadd(Atu11,Gt111,kmadd(Atu22,Gt122,kmul(Atu33,Gt133))),ToReal(3),kmadd(kmadd(Atu12,Gt112,kmadd(Atu13,Gt113,kmul(Atu23,Gt123))),ToReal(6),kmul(kmadd(Atu11,cdphi1,kmadd(Atu12,cdphi2,kmul(Atu13,cdphi3))),ToReal(18)))))))))))))))))); + + CCTK_REAL_VEC dotXt2 = + kmul(ToReal(0.333333333333333333333333333333),kmadd(kmadd(Atu12,PDstandardNth1alpha,kmadd(Atu22,PDstandardNth2alpha,kmul(Atu23,PDstandardNth3alpha))),ToReal(-6),kmadd(kmadd(PDstandardNth1beta2,Xtn1,kmul(PDstandardNth3beta2,Xtn3)),ToReal(-3),kmadd(Xtn2,kmsub(PDstandardNth3beta3,ToReal(2),PDstandardNth2beta2),kmadd(kmadd(gtu11,PDstandardNth11beta2,kmul(gtu33,PDstandardNth33beta2)),ToReal(3),kmadd(gtu22,kadd(PDstandardNth12beta1,kadd(PDstandardNth23beta3,kmadd(alphaL,kmul(S2,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth22beta2,ToReal(4))))),kmadd(gtu13,kmul(PDstandardNth13beta2,ToReal(6)),kmadd(gtu12,kadd(PDstandardNth11beta1,kadd(PDstandardNth13beta3,kmadd(alphaL,kmul(S1,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth12beta2,ToReal(7))))),kmadd(gtu23,kadd(PDstandardNth13beta1,kadd(PDstandardNth33beta3,kmadd(alphaL,kmul(S3,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth23beta2,ToReal(7))))),kmul(ToReal(2),kmadd(PDstandardNth1beta1,Xtn2,kmul(alphaL,kmadd(kmadd(gtu12,PDstandardNth1trK,kmadd(gtu22,PDstandardNth2trK,kmul(gtu23,PDstandardNth3trK))),ToReal(-2),kmadd(kmadd(Atu11,Gt211,kmadd(Atu22,Gt222,kmul(Atu33,Gt233))),ToReal(3),kmadd(kmadd(Atu12,Gt212,kmadd(Atu13,Gt213,kmul(Atu23,Gt223))),ToReal(6),kmul(kmadd(Atu12,cdphi1,kmadd(Atu22,cdphi2,kmul(Atu23,cdphi3))),ToReal(18))))))))))))))))); + + CCTK_REAL_VEC dotXt3 = + kmul(ToReal(0.333333333333333333333333333333),kmadd(kmadd(Atu13,PDstandardNth1alpha,kmadd(Atu23,PDstandardNth2alpha,kmul(Atu33,PDstandardNth3alpha))),ToReal(-6),kmadd(kmadd(PDstandardNth1beta3,Xtn1,kmul(PDstandardNth2beta3,Xtn2)),ToReal(-3),kmadd(Xtn3,kmsub(PDstandardNth2beta2,ToReal(2),PDstandardNth3beta3),kmadd(kmadd(gtu11,PDstandardNth11beta3,kmul(gtu22,PDstandardNth22beta3)),ToReal(3),kmadd(gtu33,kadd(PDstandardNth13beta1,kadd(PDstandardNth23beta2,kmadd(alphaL,kmul(S3,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth33beta3,ToReal(4))))),kmadd(gtu12,kmul(PDstandardNth12beta3,ToReal(6)),kmadd(gtu13,kadd(PDstandardNth11beta1,kadd(PDstandardNth12beta2,kmadd(alphaL,kmul(S1,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth13beta3,ToReal(7))))),kmadd(gtu23,kadd(PDstandardNth12beta1,kadd(PDstandardNth22beta2,kmadd(alphaL,kmul(S2,ToReal(-150.7964473723100754462068823974161384415)),kmul(PDstandardNth23beta3,ToReal(7))))),kmul(ToReal(2),kmadd(PDstandardNth1beta1,Xtn3,kmul(alphaL,kmadd(kmadd(gtu13,PDstandardNth1trK,kmadd(gtu23,PDstandardNth2trK,kmul(gtu33,PDstandardNth3trK))),ToReal(-2),kmadd(kmadd(Atu11,Gt311,kmadd(Atu22,Gt322,kmul(Atu33,Gt333))),ToReal(3),kmadd(kmadd(Atu12,Gt312,kmadd(Atu13,Gt313,kmul(Atu23,Gt323))),ToReal(6),kmul(kmadd(Atu13,cdphi1,kmadd(Atu23,cdphi2,kmul(Atu33,cdphi3))),ToReal(18))))))))))))))))); + + CCTK_REAL_VEC Xt1rhsL = dotXt1; + + CCTK_REAL_VEC Xt2rhsL = dotXt2; + + CCTK_REAL_VEC Xt3rhsL = dotXt3; + + CCTK_REAL_VEC dottrK = + kmsub(alphaL,kadd(SQR(Atm11),kadd(SQR(Atm22),kadd(SQR(Atm33),kmadd(SQR(trKL),ToReal(0.333333333333333333333333333333),kmadd(kmadd(Atm12,Atm21,kmadd(Atm13,Atm31,kmul(Atm23,Atm32))),ToReal(2),kmul(kadd(rho,trS),ToReal(12.56637061435917295385057353311801153679))))))),kmul(em4phi,kmadd(gtu11,PDstandardNth11alpha,kmadd(gtu22,PDstandardNth22alpha,knmsub(PDstandardNth3alpha,Xtn3,kmadd(kmadd(gtu12,PDstandardNth12alpha,kmadd(gtu13,kmadd(cdphi1,PDstandardNth3alpha,PDstandardNth13alpha),kmul(gtu23,kmadd(cdphi2,PDstandardNth3alpha,PDstandardNth23alpha)))),ToReal(2),kmadd(PDstandardNth1alpha,kmsub(kmadd(cdphi1,gtu11,kmadd(cdphi2,gtu12,kmul(cdphi3,gtu13))),ToReal(2),Xtn1),kmadd(PDstandardNth2alpha,kmsub(kmadd(cdphi1,gtu12,kmadd(cdphi2,gtu22,kmul(cdphi3,gtu23))),ToReal(2),Xtn2),kmul(gtu33,kmadd(cdphi3,kmul(PDstandardNth3alpha,ToReal(2)),PDstandardNth33alpha)))))))))); + + CCTK_REAL_VEC trKrhsL = dottrK; + + CCTK_REAL_VEC alpharhsL = + kneg(kmul(kpow(alphaL,harmonicN),kmul(ToReal(harmonicF),kmadd(ksub(AL,trKL),ToReal(LapseACoeff),trKL)))); + + CCTK_REAL_VEC ArhsL = + kmul(knmsub(AL,ToReal(AlphaDriver),dottrK),ToReal(LapseACoeff)); + + CCTK_REAL_VEC eta = + kfmin(ToReal(1),kmul(INV(rL),ToReal(SpatialBetaDriverRadius))); + + CCTK_REAL_VEC theta = + kfmin(ToReal(1),kexp(knmsub(rL,INV(ToReal(SpatialShiftGammaCoeffRadius)),ToReal(1)))); + + CCTK_REAL_VEC beta1rhsL = + kmul(theta,kmul(kadd(Xt1L,kmadd(beta1L,kmul(eta,ToReal(BetaDriver*(-1 + + ShiftBCoeff))),kmul(ksub(B1L,Xt1L),ToReal(ShiftBCoeff)))),ToReal(ShiftGammaCoeff))); + + CCTK_REAL_VEC beta2rhsL = + kmul(theta,kmul(kadd(Xt2L,kmadd(beta2L,kmul(eta,ToReal(BetaDriver*(-1 + + ShiftBCoeff))),kmul(ksub(B2L,Xt2L),ToReal(ShiftBCoeff)))),ToReal(ShiftGammaCoeff))); + + CCTK_REAL_VEC beta3rhsL = + kmul(theta,kmul(kadd(Xt3L,kmadd(beta3L,kmul(eta,ToReal(BetaDriver*(-1 + + ShiftBCoeff))),kmul(ksub(B3L,Xt3L),ToReal(ShiftBCoeff)))),ToReal(ShiftGammaCoeff))); + + CCTK_REAL_VEC B1rhsL = + kmul(knmsub(B1L,kmul(eta,ToReal(BetaDriver)),dotXt1),ToReal(ShiftBCoeff)); + + CCTK_REAL_VEC B2rhsL = + kmul(knmsub(B2L,kmul(eta,ToReal(BetaDriver)),dotXt2),ToReal(ShiftBCoeff)); + + CCTK_REAL_VEC B3rhsL = + kmul(knmsub(B3L,kmul(eta,ToReal(BetaDriver)),dotXt3),ToReal(ShiftBCoeff)); + + /* If necessary, store only partial vectors after the first iteration */ + + if (CCTK_REAL_VEC_SIZE > 2 && CCTK_BUILTIN_EXPECT(i < lc_imin && i+CCTK_REAL_VEC_SIZE > lc_imax, 0)) + { + ptrdiff_t const elt_count_lo = lc_imin-i; + ptrdiff_t const elt_count_hi = lc_imax-i; + vec_store_nta_partial_mid(alpharhs[index],alpharhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(Arhs[index],ArhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(B1rhs[index],B1rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(B2rhs[index],B2rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(B3rhs[index],B3rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(beta1rhs[index],beta1rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(beta2rhs[index],beta2rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(beta3rhs[index],beta3rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt11rhs[index],gt11rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt12rhs[index],gt12rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt13rhs[index],gt13rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt22rhs[index],gt22rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt23rhs[index],gt23rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(gt33rhs[index],gt33rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(phirhs[index],phirhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(trKrhs[index],trKrhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(Xt1rhs[index],Xt1rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(Xt2rhs[index],Xt2rhsL,elt_count_lo,elt_count_hi); + vec_store_nta_partial_mid(Xt3rhs[index],Xt3rhsL,elt_count_lo,elt_count_hi); + break; + } + + /* If necessary, store only partial vectors after the first iteration */ + + if (CCTK_REAL_VEC_SIZE > 1 && CCTK_BUILTIN_EXPECT(i < lc_imin, 0)) + { + ptrdiff_t const elt_count = lc_imin-i; + vec_store_nta_partial_hi(alpharhs[index],alpharhsL,elt_count); + vec_store_nta_partial_hi(Arhs[index],ArhsL,elt_count); + vec_store_nta_partial_hi(B1rhs[index],B1rhsL,elt_count); + vec_store_nta_partial_hi(B2rhs[index],B2rhsL,elt_count); + vec_store_nta_partial_hi(B3rhs[index],B3rhsL,elt_count); + vec_store_nta_partial_hi(beta1rhs[index],beta1rhsL,elt_count); + vec_store_nta_partial_hi(beta2rhs[index],beta2rhsL,elt_count); + vec_store_nta_partial_hi(beta3rhs[index],beta3rhsL,elt_count); + vec_store_nta_partial_hi(gt11rhs[index],gt11rhsL,elt_count); + vec_store_nta_partial_hi(gt12rhs[index],gt12rhsL,elt_count); + vec_store_nta_partial_hi(gt13rhs[index],gt13rhsL,elt_count); + vec_store_nta_partial_hi(gt22rhs[index],gt22rhsL,elt_count); + vec_store_nta_partial_hi(gt23rhs[index],gt23rhsL,elt_count); + vec_store_nta_partial_hi(gt33rhs[index],gt33rhsL,elt_count); + vec_store_nta_partial_hi(phirhs[index],phirhsL,elt_count); + vec_store_nta_partial_hi(trKrhs[index],trKrhsL,elt_count); + vec_store_nta_partial_hi(Xt1rhs[index],Xt1rhsL,elt_count); + vec_store_nta_partial_hi(Xt2rhs[index],Xt2rhsL,elt_count); + vec_store_nta_partial_hi(Xt3rhs[index],Xt3rhsL,elt_count); + continue; + } + + /* If necessary, store only partial vectors after the last iteration */ + + if (CCTK_REAL_VEC_SIZE > 1 && CCTK_BUILTIN_EXPECT(i+CCTK_REAL_VEC_SIZE > lc_imax, 0)) + { + ptrdiff_t const elt_count = lc_imax-i; + vec_store_nta_partial_lo(alpharhs[index],alpharhsL,elt_count); + vec_store_nta_partial_lo(Arhs[index],ArhsL,elt_count); + vec_store_nta_partial_lo(B1rhs[index],B1rhsL,elt_count); + vec_store_nta_partial_lo(B2rhs[index],B2rhsL,elt_count); + vec_store_nta_partial_lo(B3rhs[index],B3rhsL,elt_count); + vec_store_nta_partial_lo(beta1rhs[index],beta1rhsL,elt_count); + vec_store_nta_partial_lo(beta2rhs[index],beta2rhsL,elt_count); + vec_store_nta_partial_lo(beta3rhs[index],beta3rhsL,elt_count); + vec_store_nta_partial_lo(gt11rhs[index],gt11rhsL,elt_count); + vec_store_nta_partial_lo(gt12rhs[index],gt12rhsL,elt_count); + vec_store_nta_partial_lo(gt13rhs[index],gt13rhsL,elt_count); + vec_store_nta_partial_lo(gt22rhs[index],gt22rhsL,elt_count); + vec_store_nta_partial_lo(gt23rhs[index],gt23rhsL,elt_count); + vec_store_nta_partial_lo(gt33rhs[index],gt33rhsL,elt_count); + vec_store_nta_partial_lo(phirhs[index],phirhsL,elt_count); + vec_store_nta_partial_lo(trKrhs[index],trKrhsL,elt_count); + vec_store_nta_partial_lo(Xt1rhs[index],Xt1rhsL,elt_count); + vec_store_nta_partial_lo(Xt2rhs[index],Xt2rhsL,elt_count); + vec_store_nta_partial_lo(Xt3rhs[index],Xt3rhsL,elt_count); + break; + } /* Copy local copies back to grid functions */ - alpharhs[index] = alpharhsL; - Arhs[index] = ArhsL; - B1rhs[index] = B1rhsL; - B2rhs[index] = B2rhsL; - B3rhs[index] = B3rhsL; - beta1rhs[index] = beta1rhsL; - beta2rhs[index] = beta2rhsL; - beta3rhs[index] = beta3rhsL; - gt11rhs[index] = gt11rhsL; - gt12rhs[index] = gt12rhsL; - gt13rhs[index] = gt13rhsL; - gt22rhs[index] = gt22rhsL; - gt23rhs[index] = gt23rhsL; - gt33rhs[index] = gt33rhsL; - phirhs[index] = phirhsL; - trKrhs[index] = trKrhsL; - Xt1rhs[index] = Xt1rhsL; - Xt2rhs[index] = Xt2rhsL; - Xt3rhs[index] = Xt3rhsL; + vec_store_nta(alpharhs[index],alpharhsL); + vec_store_nta(Arhs[index],ArhsL); + vec_store_nta(B1rhs[index],B1rhsL); + vec_store_nta(B2rhs[index],B2rhsL); + vec_store_nta(B3rhs[index],B3rhsL); + vec_store_nta(beta1rhs[index],beta1rhsL); + vec_store_nta(beta2rhs[index],beta2rhsL); + vec_store_nta(beta3rhs[index],beta3rhsL); + vec_store_nta(gt11rhs[index],gt11rhsL); + vec_store_nta(gt12rhs[index],gt12rhsL); + vec_store_nta(gt13rhs[index],gt13rhsL); + vec_store_nta(gt22rhs[index],gt22rhsL); + vec_store_nta(gt23rhs[index],gt23rhsL); + vec_store_nta(gt33rhs[index],gt33rhsL); + vec_store_nta(phirhs[index],phirhsL); + vec_store_nta(trKrhs[index],trKrhsL); + vec_store_nta(Xt1rhs[index],Xt1rhsL); + vec_store_nta(Xt2rhs[index],Xt2rhsL); + vec_store_nta(Xt3rhs[index],Xt3rhsL); } - LC_ENDLOOP3 (ML_BSSN_RHS1); + LC_ENDLOOP3VEC (ML_BSSN_RHS1); } extern "C" void ML_BSSN_RHS1(CCTK_ARGUMENTS) |