Merge /Users/eschnett/Cbeta/carpet

author: Erik Schnetter <schnetter@cct.lsu.edu> 2008-07-22 13:47:09 -0500
committer: Erik Schnetter <schnetter@cct.lsu.edu> 2008-07-22 13:47:09 -0500
commit: b4da2bc7694fff331465ce0185daf70b126a0793 (patch)
tree: 5abefedf02bcd4842fe424b6e3809a6a896a5382
parent: 679c409c327078bb41481fba8757063e29cf5525 (diff)
parent: 5c20bc1bd05c8d870508d887de4fbe9a04a61e39 (diff)
41 files changed, 1731 insertions, 219 deletions
diff --git a/Carpet/Carpet/src/Comm.cc b/Carpet/Carpet/src/Comm.cc
index b09869ef9..be89d8b9d 100644
--- a/Carpet/Carpet/src/Comm.cc
+++ b/Carpet/Carpet/src/Comm.cc
@@ -2,6 +2,7 @@
 #include <cassert>
 #include <cmath>
 #include <cstdlib>
+#include <iostream>
 
 #include "cctk.h"
 #include "cctk_Parameters.h"
@@ -18,6 +19,7 @@ namespace Carpet {
   using namespace std;
 
 
+
   static void ProlongateGroupBoundaries (const cGH* cctkGH,
                                          CCTK_REAL initial_time,
                                          const vector<int>& groups);
@@ -144,8 +146,9 @@ namespace Carpet {
               mytime = vtt.at(map)->time (0, reflevel, mglevel);
               parenttime = vtt.at(map)->time (0, reflevel - 1, mglevel);
             }
+            CCTK_REAL const eps = 1.0e-12;
             bool const in_sync =
-              abs (mytime - parenttime) < 1.0e-10 * abs (delta_time);
+              abs (mytime - parenttime) <= eps * abs (delta_time);
             local_do_prolongate = in_sync;
           }
         } else {                // no tapered grids
diff --git a/Carpet/Carpet/src/Initialise.cc b/Carpet/Carpet/src/Initialise.cc
index 08a00aa84..14cc708a7 100644
--- a/Carpet/Carpet/src/Initialise.cc
+++ b/Carpet/Carpet/src/Initialise.cc
@@ -829,12 +829,7 @@ namespace Carpet {
         
         if (did_regrid) {
           for (int rl=0; rl<reflevels; ++rl) {
-            
-            bool did_recompose = false;
-            if (did_regrid) {
-              did_recompose = Recompose (cctkGH, rl, prolongate_initial_data);
-            }
-            
+            Recompose (cctkGH, rl, prolongate_initial_data);
           } // for rl
         } // if did_regrid
         
diff --git a/Carpet/Carpet/src/Recompose.cc b/Carpet/Carpet/src/Recompose.cc
index 696adf7ca..3ab820910 100644
--- a/Carpet/Carpet/src/Recompose.cc
+++ b/Carpet/Carpet/src/Recompose.cc
@@ -234,6 +234,7 @@ namespace Carpet {
     // Write grid structure to file
     OutputGridStructure (cctkGH, m, regsss);
     OutputGridCoordinates (cctkGH, m, regsss);
+#warning "TODO: output superregss"
     
     if (verbose or veryverbose) {
       OutputGrids (cctkGH, m, * vhh.at(m), * vdd.at(m));
@@ -1375,6 +1376,9 @@ namespace Carpet {
     if (DEBUG) cout << "SRMA mynprocs " << mynprocs << endl;
     
     if (DEBUG) cout << "SRMA: splitting work units" << endl;
+#warning "TODO: rename newregs to regs"
+#warning "TODO: rename nregs to nsuperregs"
+#warning "TODO: rename newnregs to nregs"
     vector<region_t> newregs;
     newregs.reserve (newnregs);
     for (int r=0, p=0; r<nregs; p+=mynprocs.at(r), ++r) {
diff --git a/Carpet/Carpet/src/Requirements.cc b/Carpet/Carpet/src/Requirements.cc
index 6a4a83ebc..c1d54f87b 100644
--- a/Carpet/Carpet/src/Requirements.cc
+++ b/Carpet/Carpet/src/Requirements.cc
@@ -73,7 +73,7 @@ namespace Carpet {
     int CheckEntry (void * attribute, void * data);
     int CheckExit  (void * attribute, void * data);
     int CheckWhile (int n_whiles, char ** whiles, void * attribute, void * data, int first);
-    int CheckIf    (int n_ifs, char ** ifs, void * attribute, void * data);
+    int CheckIf    (int n_ifs, char ** ifs, void * attribute, void * data, int first);
     int CheckCall  (void * function, void * attribute, void * data);
     
     void CheckOneGroup (cGH const * cctkGH, char const * where);
@@ -214,7 +214,8 @@ namespace Carpet {
     int
     CheckIf (int const n_ifs, char ** const ifs,
              void * const attribute,
-             void * const data)
+             void * const data,
+             int const first)
     {
       // Execute item
       return 1;
diff --git a/Carpet/Carpet/src/Restrict.cc b/Carpet/Carpet/src/Restrict.cc
index fbe9f59af..f1b047384 100644
--- a/Carpet/Carpet/src/Restrict.cc
+++ b/Carpet/Carpet/src/Restrict.cc
@@ -17,10 +17,10 @@ namespace Carpet {
   using namespace std;
   
   // restricts a set of groups
-  static void RestrictGroups (const cGH* cgh, const vector<int>& groups);
+  static void RestrictGroups (const cGH* cctkGH, const vector<int>& groups);
   
   
-  void Restrict (const cGH* cgh)
+  void Restrict (const cGH* cctkGH)
   {
     DECLARE_CCTK_PARAMETERS;
     
@@ -45,21 +45,21 @@ namespace Carpet {
     for (int group = 0; group < CCTK_NumGroups(); ++group) {
       if (CCTK_GroupTypeI(group) == CCTK_GF
           and CCTK_NumVarsInGroupI(group) > 0
-          and CCTK_QueryGroupStorageI(cgh, group)) {
+          and CCTK_QueryGroupStorageI(cctkGH, group)) {
         groups.push_back (group);
       }
     }
 
     // Restrict
-    RestrictGroups (cgh, groups);
+    RestrictGroups (cctkGH, groups);
 
     // Synchronise
-    SyncGroups (cgh, groups);
+    SyncGroups (cctkGH, groups);
   }
   
 
   // restricts a set of groups which all have the same vartype
-  static void RestrictGroups (const cGH* cgh, const vector<int>& groups) {
+  static void RestrictGroups (const cGH* cctkGH, const vector<int>& groups) {
     DECLARE_CCTK_PARAMETERS;
 
     const int tl = 0;
@@ -74,12 +74,15 @@ namespace Carpet {
           const CCTK_REAL time = vtt.at(m)->time (tl, reflevel, mglevel);
 
           const CCTK_REAL time1 = vtt.at(m)->time (0, reflevel, mglevel);
-          const CCTK_REAL time2
-            = (cgh->cctk_time - cctk_initial_time) / delta_time;
-          assert (abs(time1 - time2) / (abs(time1) + abs(time2) + abs(cgh->cctk_delta_time)) < 1e-12);
-
-          for (int v = 0; v < (int)arrdata.at(group).at(m).data.size(); ++v) {
-            ggf *const gv = arrdata.at(group).at(m).data.at(v);
+          const CCTK_REAL time2 =
+            (cctkGH->cctk_time - cctk_initial_time) / delta_time;
+          const CCTK_REAL time0 =
+            abs(time1) + abs(time2) + abs(cctkGH->cctk_delta_time);
+          const CCTK_REAL eps = 1.0e-12;
+          assert (abs(time1 - time2) <= eps * time0);
+
+          for (int v = 0; v < (int)arrdata.at(g).at(m).data.size(); ++v) {
+            ggf *const gv = arrdata.at(g).at(m).data.at(v);
 #if 0
             for (int c = 0; c < vhh.at(m)->components(reflevel); ++c) {
               gv->ref_restrict (state, tl, reflevel, c, mglevel, time);
diff --git a/Carpet/Carpet/src/SetupGH.cc b/Carpet/Carpet/src/SetupGH.cc
index b2bf94b70..7644c3733 100644
--- a/Carpet/Carpet/src/SetupGH.cc
+++ b/Carpet/Carpet/src/SetupGH.cc
@@ -1104,9 +1104,7 @@ namespace Carpet {
     if (domain_from_multipatch or domain_from_coordbase) {
       
       jjvect nboundaryzones_, is_internal_, is_staggered_, shiftout_;
-      if (domain_from_multipatch and
-          CCTK_IsFunctionAliased ("MultiPatch_GetBoundarySpecification"))
-      {
+      if (CCTK_IsFunctionAliased ("MultiPatch_GetBoundarySpecification")) {
         int const ierr =
           MultiPatch_GetBoundarySpecification (m,
                                                2*dim,
diff --git a/Carpet/Carpet/src/carpet_public.hh b/Carpet/Carpet/src/carpet_public.hh
index 5210ea45c..bd70dc047 100644
--- a/Carpet/Carpet/src/carpet_public.hh
+++ b/Carpet/Carpet/src/carpet_public.hh
@@ -9,6 +9,4 @@
 #include "modes.hh"
 #include "variables.hh"
 
-#include "defines.hh"
-
 #endif // !defined(CARPET_PUBLIC_HH)
diff --git a/Carpet/Carpet/src/defines.hh b/Carpet/Carpet/src/defines.hh
deleted file mode 100644
index 878407b69..000000000
--- a/Carpet/Carpet/src/defines.hh
+++ /dev/null
@@ -1,21 +0,0 @@
-#ifndef DEFINES_HH
-#define DEFINES_HH
-
-#include "cctk.h"
-
-#include <defs.hh>
-
-
-
-namespace Carpet {
-  
-  typedef vect<CCTK_INT,dim> jvect;
-  typedef vect<CCTK_REAL,dim> rvect;
-  typedef bbox<CCTK_INT,dim> jbbox;
-  typedef bbox<CCTK_REAL,dim> rbbox;
-  
-  typedef vect<vect<CCTK_INT,2>,dim> jjvect;
-  
-} // namespace Carpet
-
-#endif // !defined(DEFINES_HH)
diff --git a/Carpet/Carpet/src/functions.hh b/Carpet/Carpet/src/functions.hh
index ef86ca3c9..0d1e9104b 100644
--- a/Carpet/Carpet/src/functions.hh
+++ b/Carpet/Carpet/src/functions.hh
@@ -15,8 +15,6 @@
 #include "gh.hh"
 #include "vect.hh"
 
-#include "defines.hh"
-
 
   
 namespace Carpet {
diff --git a/Carpet/Carpet/src/variables.hh b/Carpet/Carpet/src/variables.hh
index a50d471ca..e80f5ae86 100644
--- a/Carpet/Carpet/src/variables.hh
+++ b/Carpet/Carpet/src/variables.hh
@@ -28,7 +28,6 @@
 #include "vect.hh"
 
 #include "carpet_public.h"
-#include "defines.hh"
 
 
 
diff --git a/Carpet/CarpetInterp/interface.ccl b/Carpet/CarpetInterp/interface.ccl
index 5b6ca8316..506f0a1db 100644
--- a/Carpet/CarpetInterp/interface.ccl
+++ b/Carpet/CarpetInterp/interface.ccl
@@ -2,12 +2,16 @@
 
 IMPLEMENTS: interp
 
-uses include header: carpet.hh
-
+uses include header: data.hh
 uses include header: bbox.hh
+uses include header: data.hh
+uses include header: defs.hh
+uses include header: dist.hh
+uses include header: ggf.hh
+uses include header: timestat.hh
 uses include header: vect.hh
 
-uses include header: data.hh
+uses include header: carpet.hh
 
 
 
diff --git a/Carpet/CarpetInterp/src/interp.cc b/Carpet/CarpetInterp/src/interp.cc
index 3fcadc9ac..86bc650ff 100644
--- a/Carpet/CarpetInterp/src/interp.cc
+++ b/Carpet/CarpetInterp/src/interp.cc
@@ -19,6 +19,7 @@
 #include "defs.hh"
 #include "dist.hh"
 #include "ggf.hh"
+#include "timestat.hh"
 #include "vect.hh"
 
 #include "carpet.hh"
@@ -83,7 +84,7 @@ namespace CarpetInterp {
               int const maxncomps,
               int const N_dims,
               int const npoints,
-              vector<CCTK_INT> const& source_map,
+              vector<CCTK_INT> & source_map,
               void const * const coords_list[],
               vector<CCTK_REAL> const& coords,
               vector<int>& procs,
@@ -186,6 +187,16 @@ namespace CarpetInterp {
 
 
 
+  static void timer_CDI (bool const dostart)
+  {
+    static Timer timer_CDI ("CarpetInterp::Carpet_DriverInterpolate");
+    if (dostart) {
+      timer_CDI.start ();
+    } else {
+      timer_CDI.stop (0);
+    }
+  }
+
   extern "C" CCTK_INT
   Carpet_DriverInterpolate (CCTK_POINTER_TO_CONST const cctkGH_,
                             CCTK_INT const N_dims,
@@ -203,6 +214,8 @@ namespace CarpetInterp {
   {
     DECLARE_CCTK_PARAMETERS;
 
+    timer_CDI (true);
+
     cGH const * const cctkGH = static_cast<cGH const *> (cctkGH_);
     assert (cctkGH);
     assert (0 <= N_dims and N_dims <= dim);
@@ -357,15 +370,18 @@ namespace CarpetInterp {
     CCTK_REAL current_time, delta_time;
     int prolongation_order_time;
 
-    int iret = extract_parameter_table_options
-      (cctkGH,
-       param_table_handle,
-       N_interp_points, N_input_arrays, N_output_arrays,
-       have_source_map, num_time_derivs,
-       prolongation_order_time, current_time, delta_time,
-       source_map, operand_indices, time_deriv_order);
-    if (iret < 0) {
-      return iret;
+    {
+      int const iret = extract_parameter_table_options
+        (cctkGH,
+         param_table_handle,
+         N_interp_points, N_input_arrays, N_output_arrays,
+         have_source_map, num_time_derivs,
+         prolongation_order_time, current_time, delta_time,
+         source_map, operand_indices, time_deriv_order);
+      if (iret < 0) {
+        timer_CDI (false);
+        return iret;
+      }
     }
 
     //////////////////////////////////////////////////////////////////////
@@ -401,9 +417,14 @@ namespace CarpetInterp {
       assert ((int)N_points_from.size() == dist::size());
       assert ((int)N_points_to.size() == dist::size());
     }
-    MPI_Alltoall (&N_points_to[0],   1, dist::datatype (N_points_to[0]),
-                  &N_points_from[0], 1, dist::datatype (N_points_from[0]),
-                  dist::comm());
+    {
+      static Timer timer ("CarpetInterp::send_npoints");
+      timer.start ();
+      MPI_Alltoall (&N_points_to[0],   1, dist::datatype (N_points_to[0]),
+                    &N_points_from[0], 1, dist::datatype (N_points_from[0]),
+                    dist::comm());
+      timer.stop (dist::size() * sizeof(CCTK_INT));
+    }
     //cout << "CarpetInterp: N_points_from=" << N_points_from << endl;
 
     //////////////////////////////////////////////////////////////////////
@@ -495,9 +516,14 @@ namespace CarpetInterp {
         tmp.AT(i) = poison;
       }
 #endif
-      MPI_Alltoallv (&coords_buffer[0], &sendcnt[0], &senddispl[0], datatype,
-                     &tmp[0],           &recvcnt[0], &recvdispl[0], datatype,
-                     dist::comm());
+      {
+        static Timer timer ("CarpetInterp::send_coordinates");
+        timer.start ();
+        MPI_Alltoallv (&coords_buffer[0], &sendcnt[0], &senddispl[0], datatype,
+                       &tmp[0],           &recvcnt[0], &recvdispl[0], datatype,
+                       dist::comm());
+        timer.stop (coords_buffer.size() * sizeof(CCTK_REAL));
+      }
 #ifndef _NDEBUG
       {
         vector<bool> filled(tmp.size(), false);
@@ -606,9 +632,14 @@ namespace CarpetInterp {
         source_map[i] = ipoison;
       }
 #endif
-      MPI_Alltoallv (&tmp[0],        &sendcnt[0], &senddispl[0], datatype,
-                     &source_map[0], &recvcnt[0], &recvdispl[0], datatype,
-                     dist::comm());
+      {
+        static Timer timer ("CarpetInterp::send_maps");
+        timer.start ();
+        MPI_Alltoallv (&tmp[0],        &sendcnt[0], &senddispl[0], datatype,
+                       &source_map[0], &recvcnt[0], &recvdispl[0], datatype,
+                       dist::comm());
+        timer.stop (tmp.size() * sizeof(CCTK_INT));
+      }
 #ifndef _NDEBUG
       {
         vector<bool> filled(source_map.size(), false);
@@ -795,9 +826,14 @@ namespace CarpetInterp {
           assert (recvdispl.AT(n) + recvcnt.AT(n) <= recvbufsize);
         }
       }
-      MPI_Alltoallv (&outputs_buffer[0], &sendcnt[0], &senddispl[0], datatype,
-                     &tmp[0],            &recvcnt[0], &recvdispl[0], datatype,
-                     dist::comm());
+      {
+        static Timer timer ("CarpetInterp::recv_points");
+        timer.start ();
+        MPI_Alltoallv (&outputs_buffer[0], &sendcnt[0], &senddispl[0], datatype,
+                       &tmp[0],            &recvcnt[0], &recvdispl[0], datatype,
+                       dist::comm());
+        timer.stop (N_interp_points * N_output_arrays * vtypesize);
+      }
       outputs_buffer.swap (tmp);
     }
 
@@ -864,7 +900,11 @@ namespace CarpetInterp {
     assert (ierr >= 0);
 
     // Done.
-    return per_proc_retvals[dist::rank()];
+    {
+      timer_CDI (false);
+      int const iret = per_proc_retvals[dist::rank()];
+      return iret;
+    }
   }
 
 
@@ -917,6 +957,9 @@ namespace CarpetInterp {
       // Check source map
 #pragma omp parallel for
       for (int n = 0; n < (int)source_map.size(); ++n) {
+        if (not (source_map.AT(n) >= 0 and source_map.AT(n) < maps)) {
+          cout << "CI: n=" << n << " map=" << source_map.AT(n) << endl;
+        }
         assert (source_map.AT(n) >= 0 and source_map.AT(n) < maps);
       }
     }
@@ -1103,7 +1146,7 @@ namespace CarpetInterp {
               int const maxncomps,
               int const N_dims,
               int const npoints,
-              vector<CCTK_INT> const& source_map,
+              vector<CCTK_INT> & source_map,
               void const* const coords_list[],
               vector<CCTK_REAL> const& coords,
               vector<int>& procs,
@@ -1114,6 +1157,9 @@ namespace CarpetInterp {
   {
     DECLARE_CCTK_PARAMETERS;
 
+    static Timer timer ("CarpetInterp::map_points");
+    timer.start ();
+
     bool const map_onto_processors = coords_list != NULL;
 
     if (not map_onto_processors) {
@@ -1179,45 +1225,50 @@ namespace CarpetInterp {
 #pragma omp parallel for
     for (int n = 0; n < npoints; ++n) {
 
-      int const m = source_map.AT(n);
-
-      gh const * const hh = arrdata.AT(coord_group).AT(m).hh;
-
-      // Find the grid point closest to the interpolation point
+      int & m = source_map.AT(n);
+      int rl, c = -1;
       rvect pos;
-      for (int d = 0; d < N_dims; ++d) {
-        if (map_onto_processors) {
-          pos[d] = static_cast<CCTK_REAL const *>(coords_list[d])[n];
-        } else {
-          pos[d] = coords[N_dims*n + d];
+      gh const * hh = NULL;
+
+      if (m >= 0) {
+        
+        hh = arrdata.AT(coord_group).AT(m).hh;
+        
+        // Find the grid point closest to the interpolation point
+        for (int d = 0; d < N_dims; ++d) {
+          if (map_onto_processors) {
+            pos[d] = static_cast<CCTK_REAL const *>(coords_list[d])[n];
+          } else {
+            pos[d] = coords[N_dims*n + d];
+          }
         }
-      }
-      
-      // Find the component that this grid point belongs to
-      
-      // Calculate rl, c, and proc
-      int rl, c;
-      if (not tree_search) {
-        find_location_linear
-          (hh, pos, lower.AT(m), upper.AT(m), delta.AT(m), ml, minrl, maxrl,
-           rl, c);
-      } else {
-        find_location_tree
-          (hh, pos, lower.AT(m), upper.AT(m), delta.AT(m), ml, minrl, maxrl,
-           rl, c);
-        if (check_tree_search) {
-          int rl2, c2;
+        
+        // Find the component that this grid point belongs to
+        
+        // Calculate rl, c, and proc
+        if (not tree_search) {
           find_location_linear
             (hh, pos, lower.AT(m), upper.AT(m), delta.AT(m), ml, minrl, maxrl,
-             rl2, c2);
-          if (rl2!=rl or c2!=c) {
+           rl, c);
+        } else {
+          find_location_tree
+            (hh, pos, lower.AT(m), upper.AT(m), delta.AT(m), ml, minrl, maxrl,
+             rl, c);
+          if (check_tree_search) {
+            int rl2, c2;
+            find_location_linear
+              (hh, pos, lower.AT(m), upper.AT(m), delta.AT(m), ml, minrl, maxrl,
+               rl2, c2);
+            if (rl2!=rl or c2!=c) {
 #pragma omp critical
-            CCTK_VWarn (CCTK_WARN_ABORT, __LINE__, __FILE__, CCTK_THORNSTRING,
-                      "Inconsistent search result from find_location_tree for interpolation point #%d at [%g,%g,%g] of patch #%d is not on any component",
-                        n, (double)pos[0], (double)pos[1], (double)pos[2], (int)m);
+              CCTK_VWarn (CCTK_WARN_ABORT, __LINE__, __FILE__, CCTK_THORNSTRING,
+                          "Inconsistent search result from find_location_tree for interpolation point #%d at [%g,%g,%g] of patch #%d is not on any component",
+                          n, (double)pos[0], (double)pos[1], (double)pos[2], (int)m);
+            }
           }
         }
-      }
+        
+      } // if m >= 0
       
       if (c == -1) {
         // The point could not be mapped onto any component
@@ -1238,13 +1289,12 @@ namespace CarpetInterp {
         rl = minrl;
         c = 0;
         
-        // Does this refinement level actually have a component?  (It
-        // may not, if this is a multi-patch simulation.)
-        if (not (hh->components(rl) > c)) {
-          cout << "CI: m=" << m << " pos=" << pos << endl;
-          CCTK_WARN (CCTK_WARN_ABORT, "Cannot interpolate a point from a patch which does not have any components at this refinement level.  Very likely your multi-patch grid structure is inconsistent, e.g. with refinement boundaries too close to a multi-patch boundary.");
-        } 
-        assert (hh->components(rl) > c);
+        // Find a patch which exists on this processor
+        for (m=0; m<maps; ++m) {
+          hh = arrdata.AT(coord_group).AT(m).hh;
+          if (hh->components(rl) > c) break;
+        }
+        assert (m < maps);
       }
       
       if (not (rl >= minrl and rl < maxrl) or
@@ -1269,6 +1319,7 @@ namespace CarpetInterp {
       ++ this_homecnts;
       
     } // for n
+    timer.stop (npoints);
   }
 
 
@@ -1299,6 +1350,9 @@ namespace CarpetInterp {
                           CCTK_INT const output_array_type_codes [],
                           CCTK_INT const input_array_variable_indices [])
   {
+    static Timer timer ("CarpetInterp::interpolate_components");
+    timer.start();
+
     // Find out about the number of time levels for interpolation
     // for all input arrays
     vector<CCTK_INT> interp_num_time_levels (N_input_arrays, 0);
@@ -1390,6 +1444,8 @@ namespace CarpetInterp {
       } // for rl
 
     } END_GLOBAL_MODE;
+
+    timer.stop (0);
   }
 
   ///////////////////////////////////////////////////////////////////////////
@@ -1562,6 +1618,9 @@ namespace CarpetInterp {
                                 CCTK_INT const output_array_type_codes [],
                                 CCTK_INT const input_array_variable_indices [])
   {
+    static Timer timer ("CarpetInterp::interpolate_single_component");
+    timer.start();
+
     // Find out the datatypes of all input grid arrays
     vector<CCTK_INT> input_array_type_codes(N_input_arrays, -1);
     vector<const void *> input_arrays(N_input_arrays);
@@ -1772,6 +1831,7 @@ namespace CarpetInterp {
       } // if need_time_interp
     } // for j
 
+    timer.stop (0);
   }
 
 } // namespace CarpetInterp
diff --git a/Carpet/CarpetInterp2/COPYING b/Carpet/CarpetInterp2/COPYING
new file mode 100644
index 000000000..1942c4334
--- /dev/null
+++ b/Carpet/CarpetInterp2/COPYING
@@ -0,0 +1,341 @@
+		    GNU GENERAL PUBLIC LICENSE
+		       Version 2, June 1991
+
+ Copyright (C) 1989, 1991 Free Software Foundation, Inc.
+                          59 Temple Place - Suite 330
+                          Boston, MA 02111-1307, USA.
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+			    Preamble
+
+  The licenses for most software are designed to take away your
+freedom to share and change it.  By contrast, the GNU General Public
+License is intended to guarantee your freedom to share and change free
+software--to make sure the software is free for all its users.  This
+General Public License applies to most of the Free Software
+Foundation's software and to any other program whose authors commit to
+using it.  (Some other Free Software Foundation software is covered by
+the GNU Library General Public License instead.)  You can apply it to
+your programs, too.
+
+  When we speak of free software, we are referring to freedom, not
+price.  Our General Public Licenses are designed to make sure that you
+have the freedom to distribute copies of free software (and charge for
+this service if you wish), that you receive source code or can get it
+if you want it, that you can change the software or use pieces of it
+in new free programs; and that you know you can do these things.
+
+  To protect your rights, we need to make restrictions that forbid
+anyone to deny you these rights or to ask you to surrender the rights.
+These restrictions translate to certain responsibilities for you if you
+distribute copies of the software, or if you modify it.
+
+  For example, if you distribute copies of such a program, whether
+gratis or for a fee, you must give the recipients all the rights that
+you have.  You must make sure that they, too, receive or can get the
+source code.  And you must show them these terms so they know their
+rights.
+
+  We protect your rights with two steps: (1) copyright the software, and
+(2) offer you this license which gives you legal permission to copy,
+distribute and/or modify the software.
+
+  Also, for each author's protection and ours, we want to make certain
+that everyone understands that there is no warranty for this free
+software.  If the software is modified by someone else and passed on, we
+want its recipients to know that what they have is not the original, so
+that any problems introduced by others will not reflect on the original
+authors' reputations.
+
+  Finally, any free program is threatened constantly by software
+patents.  We wish to avoid the danger that redistributors of a free
+program will individually obtain patent licenses, in effect making the
+program proprietary.  To prevent this, we have made it clear that any
+patent must be licensed for everyone's free use or not licensed at all.
+
+  The precise terms and conditions for copying, distribution and
+modification follow.
+
+		    GNU GENERAL PUBLIC LICENSE
+   TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION
+
+  0. This License applies to any program or other work which contains
+a notice placed by the copyright holder saying it may be distributed
+under the terms of this General Public License.  The "Program", below,
+refers to any such program or work, and a "work based on the Program"
+means either the Program or any derivative work under copyright law:
+that is to say, a work containing the Program or a portion of it,
+either verbatim or with modifications and/or translated into another
+language.  (Hereinafter, translation is included without limitation in
+the term "modification".)  Each licensee is addressed as "you".
+
+Activities other than copying, distribution and modification are not
+covered by this License; they are outside its scope.  The act of
+running the Program is not restricted, and the output from the Program
+is covered only if its contents constitute a work based on the
+Program (independent of having been made by running the Program).
+Whether that is true depends on what the Program does.
+
+  1. You may copy and distribute verbatim copies of the Program's
+source code as you receive it, in any medium, provided that you
+conspicuously and appropriately publish on each copy an appropriate
+copyright notice and disclaimer of warranty; keep intact all the
+notices that refer to this License and to the absence of any warranty;
+and give any other recipients of the Program a copy of this License
+along with the Program.
+
+You may charge a fee for the physical act of transferring a copy, and
+you may at your option offer warranty protection in exchange for a fee.
+
+  2. You may modify your copy or copies of the Program or any portion
+of it, thus forming a work based on the Program, and copy and
+distribute such modifications or work under the terms of Section 1
+above, provided that you also meet all of these conditions:
+
+    a) You must cause the modified files to carry prominent notices
+    stating that you changed the files and the date of any change.
+
+    b) You must cause any work that you distribute or publish, that in
+    whole or in part contains or is derived from the Program or any
+    part thereof, to be licensed as a whole at no charge to all third
+    parties under the terms of this License.
+
+    c) If the modified program normally reads commands interactively
+    when run, you must cause it, when started running for such
+    interactive use in the most ordinary way, to print or display an
+    announcement including an appropriate copyright notice and a
+    notice that there is no warranty (or else, saying that you provide
+    a warranty) and that users may redistribute the program under
+    these conditions, and telling the user how to view a copy of this
+    License.  (Exception: if the Program itself is interactive but
+    does not normally print such an announcement, your work based on
+    the Program is not required to print an announcement.)
+
+These requirements apply to the modified work as a whole.  If
+identifiable sections of that work are not derived from the Program,
+and can be reasonably considered independent and separate works in
+themselves, then this License, and its terms, do not apply to those
+sections when you distribute them as separate works.  But when you
+distribute the same sections as part of a whole which is a work based
+on the Program, the distribution of the whole must be on the terms of
+this License, whose permissions for other licensees extend to the
+entire whole, and thus to each and every part regardless of who wrote it.
+
+Thus, it is not the intent of this section to claim rights or contest
+your rights to work written entirely by you; rather, the intent is to
+exercise the right to control the distribution of derivative or
+collective works based on the Program.
+
+In addition, mere aggregation of another work not based on the Program
+with the Program (or with a work based on the Program) on a volume of
+a storage or distribution medium does not bring the other work under
+the scope of this License.
+
+  3. You may copy and distribute the Program (or a work based on it,
+under Section 2) in object code or executable form under the terms of
+Sections 1 and 2 above provided that you also do one of the following:
+
+    a) Accompany it with the complete corresponding machine-readable
+    source code, which must be distributed under the terms of Sections
+    1 and 2 above on a medium customarily used for software interchange; or,
+
+    b) Accompany it with a written offer, valid for at least three
+    years, to give any third party, for a charge no more than your
+    cost of physically performing source distribution, a complete
+    machine-readable copy of the corresponding source code, to be
+    distributed under the terms of Sections 1 and 2 above on a medium
+    customarily used for software interchange; or,
+
+    c) Accompany it with the information you received as to the offer
+    to distribute corresponding source code.  (This alternative is
+    allowed only for noncommercial distribution and only if you
+    received the program in object code or executable form with such
+    an offer, in accord with Subsection b above.)
+
+The source code for a work means the preferred form of the work for
+making modifications to it.  For an executable work, complete source
+code means all the source code for all modules it contains, plus any
+associated interface definition files, plus the scripts used to
+control compilation and installation of the executable.  However, as a
+special exception, the source code distributed need not include
+anything that is normally distributed (in either source or binary
+form) with the major components (compiler, kernel, and so on) of the
+operating system on which the executable runs, unless that component
+itself accompanies the executable.
+
+If distribution of executable or object code is made by offering
+access to copy from a designated place, then offering equivalent
+access to copy the source code from the same place counts as
+distribution of the source code, even though third parties are not
+compelled to copy the source along with the object code.
+
+  4. You may not copy, modify, sublicense, or distribute the Program
+except as expressly provided under this License.  Any attempt
+otherwise to copy, modify, sublicense or distribute the Program is
+void, and will automatically terminate your rights under this License.
+However, parties who have received copies, or rights, from you under
+this License will not have their licenses terminated so long as such
+parties remain in full compliance.
+
+  5. You are not required to accept this License, since you have not
+signed it.  However, nothing else grants you permission to modify or
+distribute the Program or its derivative works.  These actions are
+prohibited by law if you do not accept this License.  Therefore, by
+modifying or distributing the Program (or any work based on the
+Program), you indicate your acceptance of this License to do so, and
+all its terms and conditions for copying, distributing or modifying
+the Program or works based on it.
+
+  6. Each time you redistribute the Program (or any work based on the
+Program), the recipient automatically receives a license from the
+original licensor to copy, distribute or modify the Program subject to
+these terms and conditions.  You may not impose any further
+restrictions on the recipients' exercise of the rights granted herein.
+You are not responsible for enforcing compliance by third parties to
+this License.
+
+  7. If, as a consequence of a court judgment or allegation of patent
+infringement or for any other reason (not limited to patent issues),
+conditions are imposed on you (whether by court order, agreement or
+otherwise) that contradict the conditions of this License, they do not
+excuse you from the conditions of this License.  If you cannot
+distribute so as to satisfy simultaneously your obligations under this
+License and any other pertinent obligations, then as a consequence you
+may not distribute the Program at all.  For example, if a patent
+license would not permit royalty-free redistribution of the Program by
+all those who receive copies directly or indirectly through you, then
+the only way you could satisfy both it and this License would be to
+refrain entirely from distribution of the Program.
+
+If any portion of this section is held invalid or unenforceable under
+any particular circumstance, the balance of the section is intended to
+apply and the section as a whole is intended to apply in other
+circumstances.
+
+It is not the purpose of this section to induce you to infringe any
+patents or other property right claims or to contest validity of any
+such claims; this section has the sole purpose of protecting the
+integrity of the free software distribution system, which is
+implemented by public license practices.  Many people have made
+generous contributions to the wide range of software distributed
+through that system in reliance on consistent application of that
+system; it is up to the author/donor to decide if he or she is willing
+to distribute software through any other system and a licensee cannot
+impose that choice.
+
+This section is intended to make thoroughly clear what is believed to
+be a consequence of the rest of this License.
+
+  8. If the distribution and/or use of the Program is restricted in
+certain countries either by patents or by copyrighted interfaces, the
+original copyright holder who places the Program under this License
+may add an explicit geographical distribution limitation excluding
+those countries, so that distribution is permitted only in or among
+countries not thus excluded.  In such case, this License incorporates
+the limitation as if written in the body of this License.
+
+  9. The Free Software Foundation may publish revised and/or new versions
+of the General Public License from time to time.  Such new versions will
+be similar in spirit to the present version, but may differ in detail to
+address new problems or concerns.
+
+Each version is given a distinguishing version number.  If the Program
+specifies a version number of this License which applies to it and "any
+later version", you have the option of following the terms and conditions
+either of that version or of any later version published by the Free
+Software Foundation.  If the Program does not specify a version number of
+this License, you may choose any version ever published by the Free Software
+Foundation.
+
+  10. If you wish to incorporate parts of the Program into other free
+programs whose distribution conditions are different, write to the author
+to ask for permission.  For software which is copyrighted by the Free
+Software Foundation, write to the Free Software Foundation; we sometimes
+make exceptions for this.  Our decision will be guided by the two goals
+of preserving the free status of all derivatives of our free software and
+of promoting the sharing and reuse of software generally.
+
+			    NO WARRANTY
+
+  11. BECAUSE THE PROGRAM IS LICENSED FREE OF CHARGE, THERE IS NO WARRANTY
+FOR THE PROGRAM, TO THE EXTENT PERMITTED BY APPLICABLE LAW.  EXCEPT WHEN
+OTHERWISE STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES
+PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED
+OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.  THE ENTIRE RISK AS
+TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU.  SHOULD THE
+PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING,
+REPAIR OR CORRECTION.
+
+  12. IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
+WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR
+REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES,
+INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING
+OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED
+TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY
+YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER
+PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE
+POSSIBILITY OF SUCH DAMAGES.
+
+		     END OF TERMS AND CONDITIONS
+
+	    How to Apply These Terms to Your New Programs
+
+  If you develop a new program, and you want it to be of the greatest
+possible use to the public, the best way to achieve this is to make it
+free software which everyone can redistribute and change under these terms.
+
+  To do so, attach the following notices to the program.  It is safest
+to attach them to the start of each source file to most effectively
+convey the exclusion of warranty; and each file should have at least
+the "copyright" line and a pointer to where the full notice is found.
+
+    <one line to give the program's name and a brief idea of what it does.>
+    Copyright (C) 19yy  <name of author>
+
+    This program is free software; you can redistribute it and/or modify
+    it under the terms of the GNU General Public License as published by
+    the Free Software Foundation; either version 2 of the License, or
+    (at your option) any later version.
+
+    This program is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU General Public License for more details.
+
+    You should have received a copy of the GNU General Public License
+    along with this program; see the file COPYING.  If not, write to
+    the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+    Boston, MA 02111-1307, USA.
+
+Also add information on how to contact you by electronic and paper mail.
+
+If the program is interactive, make it output a short notice like this
+when it starts in an interactive mode:
+
+    Gnomovision version 69, Copyright (C) 19yy name of author
+    Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w'.
+    This is free software, and you are welcome to redistribute it
+    under certain conditions; type `show c' for details.
+
+The hypothetical commands `show w' and `show c' should show the appropriate
+parts of the General Public License.  Of course, the commands you use may
+be called something other than `show w' and `show c'; they could even be
+mouse-clicks or menu items--whatever suits your program.
+
+You should also get your employer (if you work as a programmer) or your
+school, if any, to sign a "copyright disclaimer" for the program, if
+necessary.  Here is a sample; alter the names:
+
+  Yoyodyne, Inc., hereby disclaims all copyright interest in the program
+  `Gnomovision' (which makes passes at compilers) written by James Hacker.
+
+  <signature of Ty Coon>, 1 April 1989
+  Ty Coon, President of Vice
+
+This General Public License does not permit incorporating your program into
+proprietary programs.  If your program is a subroutine library, you may
+consider it more useful to permit linking proprietary applications with the
+library.  If this is what you want to do, use the GNU Library General
+Public License instead of this License.
diff --git a/Carpet/CarpetInterp2/README b/Carpet/CarpetInterp2/README
new file mode 100644
index 000000000..6480393c9
--- /dev/null
+++ b/Carpet/CarpetInterp2/README
@@ -0,0 +1,8 @@
+Cactus Code Thorn CarpetInterp2
+Thorn Author(s)     : Erik Schnetter <schnetter@cct.lsu.edu>
+Thorn Maintainer(s) : Erik Schnetter <schnetter@cct.lsu.edu>
+--------------------------------------------------------------------------
+
+Purpose of the thorn:
+
+This thorn provides a parallel interpolator for Carpet.
diff --git a/Carpet/CarpetInterp2/configuration.ccl b/Carpet/CarpetInterp2/configuration.ccl
new file mode 100644
index 000000000..1391494a9
--- /dev/null
+++ b/Carpet/CarpetInterp2/configuration.ccl
@@ -0,0 +1,5 @@
+# Configuration definitions for thorn CarpetInterp2
+
+REQUIRES Carpet CarpetLib
+
+REQUIRES THORNS: Carpet CarpetLib
diff --git a/Carpet/CarpetInterp2/interface.ccl b/Carpet/CarpetInterp2/interface.ccl
new file mode 100644
index 000000000..b161281b8
--- /dev/null
+++ b/Carpet/CarpetInterp2/interface.ccl
@@ -0,0 +1,42 @@
+# Interface definition for thorn CarpetInterp
+
+IMPLEMENTS: interp2
+
+USES INCLUDE HEADER: defs.hh
+USES INCLUDE HEADER: typeprops.hh
+USES INCLUDE HEADER: vect.hh
+
+USES INCLUDE HEADER: carpet.hh
+
+
+
+# Get access to communicators
+CCTK_POINTER_TO_CONST \
+FUNCTION GetMPICommWorld (CCTK_POINTER_TO_CONST IN cctkGH)
+REQUIRES FUNCTION GetMPICommWorld
+
+# Access coordinate information (on the coarse level)
+CCTK_INT FUNCTION GetCoordRange        \
+    (CCTK_POINTER_TO_CONST IN  cctkGH, \
+     CCTK_INT              IN  m,      \
+     CCTK_INT              IN  ml,     \
+     CCTK_INT              IN  size,   \
+     CCTK_INT        ARRAY OUT gsh,    \
+     CCTK_REAL       ARRAY OUT lower,  \
+     CCTK_REAL       ARRAY OUT upper,  \
+     CCTK_REAL       ARRAY OUT delta)
+REQUIRES FUNCTION GetCoordRange
+
+
+
+CCTK_INT FUNCTION                                \
+    MultiPatch_GlobalToLocal                     \
+        (CCTK_POINTER_TO_CONST IN  cctkGH,       \
+         CCTK_INT              IN  ndims,        \
+         CCTK_INT              IN  npoints,      \
+         CCTK_POINTER_TO_CONST IN  globalcoords, \
+         CCTK_INT        ARRAY OUT patch,        \
+         CCTK_POINTER          IN localcoords,   \
+         CCTK_POINTER          IN dadx,          \
+         CCTK_POINTER          IN ddadxdx)
+USES FUNCTION MultiPatch_GlobalToLocal
diff --git a/Carpet/CarpetInterp2/param.ccl b/Carpet/CarpetInterp2/param.ccl
new file mode 100644
index 000000000..9061931b7
--- /dev/null
+++ b/Carpet/CarpetInterp2/param.ccl
@@ -0,0 +1 @@
+# Parameter definitions for thorn CarpetInterp
diff --git a/Carpet/CarpetInterp2/schedule.ccl b/Carpet/CarpetInterp2/schedule.ccl
new file mode 100644
index 000000000..96d18609b
--- /dev/null
+++ b/Carpet/CarpetInterp2/schedule.ccl
@@ -0,0 +1 @@
+# Schedule definitions for thorn CarpetInterp
diff --git a/Carpet/CarpetInterp2/src/fasterp.cc b/Carpet/CarpetInterp2/src/fasterp.cc
new file mode 100644
index 000000000..1c945710f
--- /dev/null
+++ b/Carpet/CarpetInterp2/src/fasterp.cc
@@ -0,0 +1,662 @@
+#include <cassert>
+#include <cmath>
+#include <cstddef>
+#include <cstdlib>
+
+#include <cctk.h>
+
+#include <mpi.h>
+
+#include <carpet.hh>
+
+#include "fasterp.hh"
+
+
+
+namespace CarpetInterp2 {
+  
+  
+  
+  // Create an MPI datatype for location information
+  MPI_Datatype
+  fasterp_iloc_t::mpi_datatype ()
+  {
+    static bool initialised = false;
+    static MPI_Datatype newtype;
+    if (not initialised) {
+      static fasterp_iloc_t s;
+#define ARRSIZE(m) (sizeof(s.m) / sizeof(s.m[0]))
+#define OFFSET(m)  ((char*)&(s.m) - (char*)&(s)) // offsetof doesn't work (why?)
+#define SIZE       (sizeof(s))
+      CCTK_REAL rdummy;
+      dist::mpi_struct_descr_t const descr[] = {
+        {              1, OFFSET(m     ), MPI_INT               },
+        {              1, OFFSET(rl    ), MPI_INT               },
+        {              1, OFFSET(c     ), MPI_INT               },
+        {              1, OFFSET(ind3d ), MPI_INT               },
+        {ARRSIZE(offset), OFFSET(offset), dist::datatype(rdummy)},
+        {              1, SIZE          , MPI_UB                }
+      };
+#undef ARRSIZE
+#undef OFFSET
+#undef SIZE
+      dist::create_mpi_datatype
+        (sizeof(descr) / sizeof(descr[0]), descr, newtype);
+      initialised = true;
+    }
+    return newtype;
+  }
+  
+  
+  
+  //////////////////////////////////////////////////////////////////////////////
+  //////////////////////////////////////////////////////////////////////////////
+  //////////////////////////////////////////////////////////////////////////////
+  
+  
+  
+  // Calculate the coefficients for one interpolation stencil
+  void
+  fasterp_src_loc_t::
+  calc_stencil (fasterp_iloc_t const & iloc,
+                int const order)
+  {
+    assert (order <= max_order);
+    CCTK_REAL const rone = 1.0;
+    CCTK_REAL const eps = 1.0e-12;
+    int const n0 = (order+1) / 2;
+    CCTK_REAL const offset = order % 2 == 0 ? 0.5 : 0.0;
+    for (int d=0; d<dim; ++d) {
+      // C_n = Pi_m[m!=n] [(x_i - x_m) / (x_n - x_m)]
+      CCTK_REAL const xi = iloc.offset[d] - offset;
+      if (order % 2 == 0) {
+        assert (xi >= -rone/2 and xi < +rone/2);
+      } else {
+        assert (xi >= 0 and xi < rone);
+      }
+      if (fabs(xi) >= eps) {
+        assert (fabs(fmod(xi, rone)) <= eps/2);
+        for (int n=0; n<=order; ++n) {
+          CCTK_REAL const xn = n - n0;
+          CCTK_REAL c = 1.0;
+          for (int m=0; m<=order; ++m) {
+            if (m != n) {
+              CCTK_REAL const xm = m - n0;
+              c *= (xi - xm) / (xn - xm);
+            }
+          }
+          coeffs[d][n] = c;
+        }
+        exact[d] = false;
+        // The sum of the coefficients must be one
+        CCTK_REAL s = 0.0;
+        for (int n=0; n<=order; ++n) {
+          s += coeffs[d][n];
+        }
+        assert (fabs(s - rone) <= eps);
+      } else {
+        exact[d] = true;
+      }
+    }
+    ind3d = iloc.ind3d;
+  }
+  
+  
+  
+  // Interpolate a set of variables at the same location, with a given
+  // set of interpolation coefficients.  The template mechanism allows
+  // the order in each direction to be different; in particular, the
+  // order can be 0 if the interpolation location coincides with a
+  // source grid point.  For interpolation to order O, this function
+  // should be instantiated eight times, with On=O and On=0, for
+  // n=[0,1,2].  We hope that the compiler optimises the for loops
+  // away if On=0.
+  template <int O0, int O1, int O2>
+  void
+  fasterp_src_loc_t::
+  interpolate (ivect const & lsh,
+               vector<CCTK_REAL const *> const & varptrs,
+               CCTK_REAL * restrict const vals)
+    const
+  {
+    size_t const di = 1;
+    size_t const dj = di * lsh[0];
+    size_t const dk = dj * lsh[1];
+    
+    for (size_t v=0; v<varptrs.size(); ++v) {
+      vals[v] = 0.0;
+    }
+    
+    for (size_t k=0; k<=O2; ++k) {
+      CCTK_REAL const coeff_k = coeffs[2][k];
+      for (size_t j=0; j<=O1; ++j) {
+        CCTK_REAL const coeff_jk = coeff_k * coeffs[1][j];
+        for (size_t i=0; i<=O0; ++i) {
+          CCTK_REAL const coeff_ijk = coeff_jk * coeffs[0][i];
+          
+          for (size_t v=0; v<varptrs.size(); ++v) {
+            vals[v] += coeff_ijk * varptrs.AT(v)[ind3d + i*di + j*dj + k*dk];
+          } // for v
+          
+        }
+      }
+    }
+  }
+  
+  
+  
+  // Interpolate a set of variables at the same location, with a given
+  // set of interpolation coefficients.  This calls the specialised
+  // interpolation function, depending on whether interpolation is
+  // exact in each of the directions.
+  template <int O>
+  void
+  fasterp_src_loc_t::
+  interpolate (ivect const & lsh,
+               vector<CCTK_REAL const *> const & varptrs,
+               CCTK_REAL * restrict const vals)
+    const
+  {
+    int const Z = 0;
+    if (exact[2]) {
+      if (exact[1]) {
+        if (exact[0]) {
+          interpolate<Z,Z,Z> (lsh, varptrs, vals);
+        } else {
+          interpolate<Z,Z,O> (lsh, varptrs, vals);
+        }
+      } else {
+        if (exact[0]) {
+          interpolate<Z,O,Z> (lsh, varptrs, vals);
+        } else {
+          interpolate<Z,O,O> (lsh, varptrs, vals);
+        }
+      }
+    } else {
+      if (exact[1]) {
+        if (exact[0]) {
+          interpolate<O,Z,Z> (lsh, varptrs, vals);
+        } else {
+          interpolate<O,Z,O> (lsh, varptrs, vals);
+        }
+      } else {
+        if (exact[0]) {
+          interpolate<O,O,Z> (lsh, varptrs, vals);
+        } else {
+          interpolate<O,O,O> (lsh, varptrs, vals);
+        }
+      }
+    }
+  }
+  
+  
+  
+  // Interpolate a set of variables at the same location, with a given
+  // set of interpolation coefficients.  This calls a specialised
+  // interpolation function, depending on whether interpolation is
+  // exact in each of the directions.
+  void
+  fasterp_src_loc_t::
+  interpolate (ivect const & lsh,
+               int const order,
+               vector<CCTK_REAL const *> const & varptrs,
+               CCTK_REAL * restrict const vals)
+    const
+  {
+    switch (order) {
+    case  0: interpolate< 0> (lsh, varptrs, vals); break;
+    case  1: interpolate< 1> (lsh, varptrs, vals); break;
+    case  2: interpolate< 2> (lsh, varptrs, vals); break;
+    case  3: interpolate< 3> (lsh, varptrs, vals); break;
+    case  4: interpolate< 4> (lsh, varptrs, vals); break;
+    case  5: interpolate< 5> (lsh, varptrs, vals); break;
+    case  6: interpolate< 6> (lsh, varptrs, vals); break;
+    case  7: interpolate< 7> (lsh, varptrs, vals); break;
+    case  8: interpolate< 8> (lsh, varptrs, vals); break;
+    case  9: interpolate< 9> (lsh, varptrs, vals); break;
+    case 10: interpolate<10> (lsh, varptrs, vals); break;
+    case 11: interpolate<11> (lsh, varptrs, vals); break;
+    default:
+      // Add higher orders here as desired
+      CCTK_WARN (CCTK_WARN_ABORT, "Interpolation orders larger than 11 are not yet implemented");
+      assert (0);
+    }
+  }
+  
+  
+  
+  //////////////////////////////////////////////////////////////////////////////
+  //////////////////////////////////////////////////////////////////////////////
+  //////////////////////////////////////////////////////////////////////////////
+  
+  
+  
+  // Set up an interpolation
+  fasterp_setup_t::
+  fasterp_setup_t (cGH const * restrict const cctkGH,
+                   fasterp_glocs_t const & locations,
+                   int const order_)
+    : order (order_)
+  {
+    // Some global properties
+    int const npoints = locations.size();
+    int const nprocs = CCTK_nProcs (cctkGH);
+    // int const myproc = CCTK_MyProc (cctkGH);
+    
+    
+    
+    // Calculate patch numbers and local coordinates
+    fasterp_llocs_t local_locations (npoints);
+    
+    if (CCTK_IsFunctionAliased ("MultiPatch_GlobalToLocal")) {
+      // This is a muulti-patch simulation: convert global to local
+      // coordinates
+      
+      CCTK_REAL const * coords[dim];
+      CCTK_REAL       * local_coords[dim];
+      for (int d=0; d<dim; ++d) {
+        coords[d]       = &locations.coords[d].front();
+        local_coords[d] = &local_locations.coords[d].front();
+      }
+      
+      int const ierr = MultiPatch_GlobalToLocal
+        (cctkGH, dim, npoints,
+         coords,
+         &local_locations.maps.front(), local_coords, NULL, NULL);
+      assert (not ierr);
+      
+    } else {
+      // This is a single-patch simulation
+      
+      // TODO: Optimise this: don't copy coordinates, and don't store
+      // map numbers if there is only one map.
+      for (int n=0; n<npoints; ++n) {
+        int const m = 0;
+        local_locations.maps.AT(n) = m;
+        for (int d=0; d<dim; ++d) {
+          local_locations.coords[d].AT(n) = locations.coords[d].AT(n);
+        }
+      }
+      
+    } // if not multi-patch
+    
+    // Obtain the coordinate ranges for all patches
+    vector<rvect> lower (Carpet::maps);
+    vector<rvect> upper (Carpet::maps);
+    vector<rvect> delta (Carpet::maps); // spacing on finest possible grid
+    for (int m=0; m<Carpet::maps; ++m) {
+      jvect gsh;
+      int const ierr =
+        GetCoordRange (cctkGH, m, Carpet::mglevel, dim,
+                       & gsh[0],
+                       & lower.AT(m)[0], & upper.AT(m)[0], & delta.AT(m)[0]);
+      assert (not ierr);
+      delta.AT(m) /= Carpet::maxspacereflevelfact;
+    }
+    
+    // Calculate refinement levels, components, and integer grid point
+    // indices
+    vector<fasterp_iloc_t> ilocs (npoints);
+    vector<int> proc (npoints);
+    vector<int> nlocs (nprocs, 0);
+    int n_nz_nlocs = 0;
+    assert (Carpet::is_level_mode());
+    for (int n=0; n<npoints; ++n) {
+      int const m = local_locations.maps.AT(n);
+      rvect const pos (local_locations.coords[0].AT(n),
+                       local_locations.coords[1].AT(n),
+                       local_locations.coords[2].AT(n));
+      
+      gh const * const hh = Carpet::vhh.AT(m);
+      ibbox const & baseext = hh->baseextent(Carpet::mglevel, 0);
+      rvect const rpos =
+        (pos - lower.AT(m)) / (upper.AT(m) - lower.AT(m)) *
+        rvect (baseext.upper() - baseext.lower());
+      
+      // Find refinement level and component
+      int rl, c;
+      ivect ipos;
+      hh->locate_position (rpos,
+                           Carpet::mglevel,
+                           Carpet::reflevel, Carpet::reflevel+1,
+                           rl, c, ipos);
+      
+      ibbox const & ext =
+        Carpet::vdd.AT(m)->boxes.AT(Carpet::mglevel).AT(rl).AT(c).exterior;
+      
+      rvect dpos = rpos - rvect(ipos);
+      if (order % 2 != 0) {
+        // Potentially shift the stencil anchor for odd interpolation
+        // orders (i.e., for even numbers of stencil points)
+        ipos -= either (dpos > rvect(0), ext.stride(), ivect(0));
+        dpos = rpos - rvect(ipos);
+      }
+      
+      ivect const ind = ipos - ext.lower() / ext.stride();
+      ivect const lsh = ext.shape() / ext.stride();
+      int const ind3d = ind[0] + lsh[0] * (ind[1] + lsh[1] * ind[2]);
+      
+      // Store result
+      fasterp_iloc_t & iloc = ilocs.AT(n);
+      iloc.m      = m;
+      iloc.rl     = rl;
+      iloc.c      = c;
+      iloc.ind3d  = ind3d;
+      iloc.offset = dpos;
+      
+      // Find source processor
+      int const p = Carpet::vhh.AT(m)->processor(rl,c);
+      proc.AT(n) = p;
+      if (nlocs.AT(p) == 0) ++n_nz_nlocs;
+      ++ nlocs.AT(p);
+    }
+    
+    
+    
+    // Find mapping from processors to "processor indices": It may be
+    // too expensive to store data for all processors, so we store
+    // only data about those processors with which we actually
+    // communicate.
+    {
+      recv_descr.procs.resize (n_nz_nlocs);
+      recv_descr.procinds.resize (nprocs, -1);
+      int pp = 0;
+      int offset = 0;
+      for (int p=0; p<nprocs; ++p) {
+        if (nlocs.AT(p) > 0) {
+          recv_descr.procs.AT(pp).p       = p;
+          recv_descr.procs.AT(pp).offset  = offset;
+          recv_descr.procs.AT(pp).npoints = nlocs.AT(p);
+          recv_descr.procinds.AT(p) = pp;
+          ++ pp;
+          offset += nlocs.AT(p);
+        }
+      }
+      assert (pp == n_nz_nlocs);
+      assert (offset == npoints);
+      recv_descr.npoints = npoints;
+    }
+    
+    // Create a mapping "index" from location index, as specified by
+    // the user, to the index order in which the data are received
+    // from the other processors.
+    {
+      vector<int> index (recv_descr.procs.size());
+      for (int pp=0; pp<int(recv_descr.procs.size()); ++pp) {
+        index.AT(pp) = recv_descr.procs.AT(pp).offset;
+      }
+      recv_descr.index.resize (npoints);
+      for (int n=0; n<npoints; ++n) {
+        int const p = proc.AT(n);
+        int const pp = recv_descr.procinds.AT(p);
+        assert (pp >= 0);
+        recv_descr.index.AT(n) = index.AT(pp);
+        ++index.AT(pp);
+      }
+      for (int pp=0; pp<int(recv_descr.procs.size()); ++pp) {
+        int const recv_npoints = index.AT(pp) - recv_descr.procs.AT(pp).offset;
+        assert (recv_npoints == recv_descr.procs.AT(pp).npoints);
+      }
+    }
+    
+    
+    
+    // Count the number of points which have to be sent to other
+    // processors, and exchange this information with MPI
+    vector<int> send_npoints (nprocs, 0), send_offsets (nprocs);
+    {
+      int offset = 0;
+      for (int pp=0; pp<int(recv_descr.procs.size()); ++pp) {
+        int const p = recv_descr.procs.AT(pp).p;
+        send_npoints.AT(p) = recv_descr.procs.AT(pp).npoints;
+        send_offsets.AT(p) = offset;
+        offset += send_npoints.AT(p);
+      }
+      assert (offset == npoints);
+    }
+    vector<int> recv_npoints (nprocs), recv_offsets (nprocs);
+    MPI_Alltoall (&send_npoints.front(), 1, MPI_INT,
+                  &recv_npoints.front(), 1, MPI_INT,
+                  MPI_COMM_WORLD);
+    int npoints_source = 0;
+    for (int p=0; p<nprocs; ++p) {
+      recv_offsets.AT(p) = npoints_source;
+      npoints_source += recv_npoints.AT(p);
+    }
+    
+    // Scatter the location information into a send-array, and
+    // exchange it with MPI
+    vector<fasterp_iloc_t> scattered_ilocs(npoints);
+    for (int n=0; n<npoints; ++n) {
+      scattered_ilocs.AT(recv_descr.index.AT(n)) = ilocs.AT(n);
+    }
+    vector<fasterp_iloc_t> gathered_ilocs(npoints_source);
+    MPI_Comm & comm_world = * (MPI_Comm *) GetMPICommWorld (cctkGH);
+    MPI_Alltoallv
+      (&scattered_ilocs.front(), &send_npoints.front(), &send_offsets.front(),
+       fasterp_iloc_t::mpi_datatype(),
+       &gathered_ilocs.front(),  &recv_npoints.front(), &recv_offsets.front(),
+       fasterp_iloc_t::mpi_datatype(),
+       comm_world);
+    
+    
+    
+    // Fill in send descriptors
+    send_descr.npoints = npoints_source;
+    
+    {
+      int n_nz_recv_npoints = 0;
+      for (int p=0; p<nprocs; ++p) {
+        if (recv_npoints.AT(p) > 0) ++n_nz_recv_npoints;
+      }
+      send_descr.procs.resize (n_nz_recv_npoints);
+      int pp = 0;
+      for (int p=0; p<nprocs; ++p) {
+        if (recv_npoints.AT(p) > 0) {
+          send_proc_t & send_proc = send_descr.procs.AT(pp);
+          send_proc.p       = p;
+          send_proc.offset  = recv_offsets.AT(p);
+          send_proc.npoints = recv_npoints.AT(p);
+          ++pp;
+        }
+      }
+      assert (pp == n_nz_recv_npoints);
+    }
+    
+    for (size_t pp=0; pp<send_descr.procs.size(); ++pp) {
+      send_proc_t & send_proc = send_descr.procs.AT(pp);
+      
+      send_proc.maps.resize (Carpet::maps);
+      for (int m=0; m<Carpet::maps; ++m) {
+        send_proc.maps.AT(m).rls.resize (Carpet::reflevels);
+        for (int rl=0; rl<Carpet::reflevels; ++rl) {
+          int const ncomps = Carpet::vhh.AT(m)->components (rl);
+          send_proc.maps.AT(m).rls.AT(rl).compinds.resize (ncomps, -1);
+        }
+      }
+      
+      vector<vector<vector<int> > > npoints_comp (Carpet::maps);
+      for (int m=0; m<Carpet::maps; ++m) {
+        npoints_comp.AT(m).resize(Carpet::reflevels);
+        for (int rl=0; rl<Carpet::reflevels; ++rl) {
+          int const ncomps = Carpet::vhh.AT(m)->components (rl);
+          npoints_comp.AT(m).AT(rl).resize(ncomps, 0);
+        }
+      }
+      
+      vector<vector<int> > n_nz_npoints_comp (Carpet::maps);
+      for (int m=0; m<Carpet::maps; ++m) {
+        n_nz_npoints_comp.AT(m).resize(Carpet::reflevels, 0);
+      }
+      
+      for (int n=0; n<send_proc.npoints; ++n) {
+        fasterp_iloc_t const & iloc = gathered_ilocs.AT(send_proc.offset + pp);
+        int const m  = iloc.m;
+        int const rl = iloc.rl;
+        int const c  = iloc.c;
+        if (npoints_comp.AT(m).AT(rl).AT(c) == 0) {
+          ++ n_nz_npoints_comp.AT(m).AT(rl);
+        }
+        ++ npoints_comp.AT(m).AT(rl).AT(c);
+      }
+      
+      for (int m=0; m<Carpet::maps; ++m) {
+        for (int rl=0; rl<Carpet::reflevels; ++rl) {
+          send_proc.maps.AT(m).rls.AT(rl).comps.resize
+            (n_nz_npoints_comp.AT(m).AT(rl));
+          int cc = 0;
+          int const ncomps = Carpet::vhh.AT(m)->components (rl);
+          for (int c=0; c<ncomps; ++c) {
+            if (npoints_comp.AT(m).AT(rl).AT(c) > 0) {
+              send_comp_t & comp = send_proc.maps.AT(m).rls.AT(rl).comps.AT(cc);
+              comp.locs.clear();
+              comp.locs.reserve (npoints_comp.AT(m).AT(rl).AT(c));
+              comp.c = c;
+              send_proc.maps.AT(m).rls.AT(rl).compinds.AT(c) = cc;
+              ++cc;
+            }
+          }
+        }
+      }
+      
+    } // for pp
+    
+    
+    
+    // Calculate stencil coefficients
+    for (size_t pp=0; pp<send_descr.procs.size(); ++pp) {
+      send_proc_t & send_proc = send_descr.procs.AT(pp);
+      for (int n=0; n<send_proc.npoints; ++n) {
+        fasterp_iloc_t const & iloc = gathered_ilocs.AT(send_proc.offset+pp);
+        int const m  = iloc.m;
+        int const rl = iloc.rl;
+        int const c  = iloc.c;
+        
+        fasterp_src_loc_t sloc;
+        sloc.calc_stencil (iloc, order);
+        
+        int const cc = send_proc.maps.AT(m).rls.AT(rl).compinds.AT(c);
+        send_comp_t & comp = send_proc.maps.AT(m).rls.AT(rl).comps.AT(cc);
+        comp.locs.push_back (sloc);
+      }
+    } // for pp
+  }
+  
+  
+  
+  // Free the setup for one interpolation
+  fasterp_setup_t::
+  ~fasterp_setup_t ()
+  {
+    // do nothing -- C++ calls destructors automatically
+  }
+  
+  
+  
+  // Interpolate
+  void 
+  fasterp_setup_t::
+  interpolate (cGH const * restrict const cctkGH,
+               vector<int> const & varinds,
+               vector<CCTK_REAL *> & values)
+    const
+  {
+    size_t const nvars = varinds.size();
+    assert (values.size() == nvars);
+    for (size_t v=0; v<values.size(); ++v) {
+      assert (varinds.AT(v) >= 0 and varinds.AT(v) <= CCTK_NumVars());
+      // Ensure that variable is GF
+      // Ensure that variable has "good" type
+      // Ensure that variable has storage
+      assert (values.AT(v) != NULL);
+    }
+    
+    MPI_Comm & comm_world = * (MPI_Comm *) GetMPICommWorld (cctkGH);
+    
+    // Post Irecvs
+    vector<CCTK_REAL> recv_points (recv_descr.npoints * nvars);
+    vector<MPI_Request> recv_reqs (recv_descr.procs.size());
+    for (size_t pp=0; pp<recv_descr.procs.size(); ++pp) {
+      recv_proc_t const & recv_proc = recv_descr.procs.AT(pp);
+      
+      CCTK_REAL rdummy;
+      int const tag = 0;
+      MPI_Irecv (& recv_points.AT(recv_proc.offset * nvars),
+                 recv_proc.npoints * nvars,
+                 dist::datatype (rdummy), recv_proc.p, tag,
+                 comm_world, & recv_reqs.AT(pp));
+    }
+    
+    // Interpolate data and post Isends
+    vector<CCTK_REAL> send_points (send_descr.npoints);
+    vector<CCTK_REAL>::iterator destit = send_points.begin();
+    vector<MPI_Request> send_reqs (send_descr.procs.size());
+    for (size_t pp=0; pp<send_descr.procs.size(); ++pp) {
+      send_proc_t const & send_proc = send_descr.procs.AT(pp);
+      
+      for (size_t m=0; m<send_proc.maps.size(); ++m) {
+        send_map_t const & send_map = send_proc.maps.AT(m);
+        for (size_t rl=0; rl<send_map.rls.size(); ++rl) {
+          send_rl_t const & send_rl = send_map.rls.AT(rl);
+          for (size_t cc=0; cc<send_rl.comps.size(); ++cc) {
+            send_comp_t const & send_comp = send_rl.comps.AT(cc);
+            int const c = send_comp.c;
+            
+            dh const & dd = * Carpet::vdd.AT(m);
+            ibbox const &
+              ext = dd.boxes.AT(Carpet::mglevel).AT(rl).AT(c).exterior;
+            ivect const lsh = ext.shape() / ext.stride();
+            
+            // Get pointers to 3D data
+            vector<CCTK_REAL const *> varptrs (nvars);
+            for (size_t v=0; v<nvars; ++v) {
+              int const gi = CCTK_GroupIndexFromVarI (varinds.AT(v));
+              assert (gi >= 0);
+              int const vi = varinds.AT(v) - CCTK_FirstVarIndexI (gi);
+              assert (vi >= 0);
+              int const tl = 0;
+              varptrs.AT(v) =
+                (CCTK_REAL const *)
+                (* Carpet::arrdata.AT(gi).AT(m).data.AT(vi))
+                (tl, rl, c, Carpet::mglevel)->storage();
+              assert (varptrs.AT(v));
+            }
+            
+            for (size_t n=0; n<send_comp.locs.size(); ++n) {
+              assert (destit + nvars <= send_points.end());
+              send_comp.locs.AT(n).interpolate
+                (lsh, order, varptrs, & * destit);
+              destit += nvars;
+            }
+            
+          } // for cc
+        }   // for rl
+      }     // for m
+      
+      CCTK_REAL rdummy;
+      int const tag = 0;
+      MPI_Isend (& send_points.AT(send_proc.offset * nvars),
+                 send_proc.npoints * nvars,
+                 dist::datatype (rdummy), send_proc.p, tag,
+                 comm_world, & send_reqs.AT(pp));
+    } // for pp
+    assert (destit == send_points.end());
+    
+    // Wait for Irecvs to complete
+    MPI_Waitall (recv_reqs.size(), & recv_reqs.front(), MPI_STATUSES_IGNORE);
+    
+    // Gather data
+    for (int n=0; n<recv_descr.npoints; ++n) {
+      int const nn = recv_descr.index.AT(n);
+      for (size_t v=0; v<nvars; ++v) {
+        values.AT(v)[n] = recv_points.AT(nn);
+      }
+    }
+    
+    // Wait for Isends to complete
+    MPI_Waitall (send_reqs.size(), & send_reqs.front(), MPI_STATUSES_IGNORE);
+  }
+  
+  
+  
+} // namespace CarpetInterp2
diff --git a/Carpet/CarpetInterp2/src/fasterp.hh b/Carpet/CarpetInterp2/src/fasterp.hh
new file mode 100644
index 000000000..84b20da80
--- /dev/null
+++ b/Carpet/CarpetInterp2/src/fasterp.hh
@@ -0,0 +1,186 @@
+#ifndef FASTERP_HH
+#define FASTERP_HH
+
+#include <cstdlib>
+#include <vector>
+
+#include <cctk.h>
+
+#include <defs.hh>
+#include <dist.hh>
+#include <typeprops.hh>
+#include <vect.hh>
+
+
+
+namespace CarpetInterp2 {
+  
+  using namespace std;
+  
+  
+  
+  int const dim = 3;
+  
+  // An interpolation point descriptor requires (3 * (max_order+1) +
+  // 1) double precision values of memory
+  int const max_order = 5;
+  
+  
+  
+  // A global location, given by its global coordinates
+  struct fasterp_glocs_t {
+    vector<CCTK_REAL> coords[dim];
+    fasterp_glocs_t (size_t const n)
+    {
+      for (int d=0; d<dim; ++d) {
+        coords[d].resize(n);
+      }
+    }
+    size_t size () const { return coords[0].size(); }
+  };
+  
+  // A local location, given by map and local coordinates
+  struct fasterp_llocs_t {
+    vector<int> maps;
+    vector<CCTK_REAL> coords[dim];
+    fasterp_llocs_t (size_t const n)
+    {
+      maps.resize(n);
+      for (int d=0; d<dim; ++d) {
+        coords[d].resize(n);
+      }
+    }
+    size_t size () const { return maps.size(); }
+  };
+  
+  // An integer location, given by map, refinement level, and
+  // component
+  struct fasterp_iloc_t {
+    int m, rl, c;
+    
+    // ivect idx;
+    int ind3d;
+    rvect offset;               // in terms of grid points
+    
+    static MPI_Datatype mpi_datatype ();
+  };
+  
+  
+  
+  struct fasterp_dest_loc_t {
+    // ivect idx;
+    int ind3d;                  // destination grid point index
+  };
+  
+  class fasterp_src_loc_t {
+    CCTK_REAL coeffs[dim][max_order+1]; // interpolation coefficients
+    bvect exact;
+    
+    // ivect idx;
+    int ind3d;                  // source grid point offset
+    
+  public:
+    void
+    calc_stencil (fasterp_iloc_t const & iloc,
+                  int order);
+    void
+    interpolate (ivect const & lsh,
+                 int order,
+                 vector<CCTK_REAL const *> const & varptrs,
+                 CCTK_REAL * restrict vals)
+      const;
+    
+  private:
+    template <int O>
+    void
+    interpolate (ivect const & lsh,
+                 vector<CCTK_REAL const *> const & varptrs,
+                 CCTK_REAL * restrict vals)
+      const;
+    template <int O0, int O1, int O2>
+    void
+    interpolate (ivect const & lsh,
+                 vector<CCTK_REAL const *> const & varptrs,
+                 CCTK_REAL * restrict vals)
+      const;
+  };
+  
+  
+  
+  // A receive descriptor, describing what is received from other
+  // processors
+  struct recv_proc_t {
+    int p;                      // sending processor
+    int offset;
+    int npoints;                // total number of received points
+  };
+
+  struct recv_descr_t {
+    vector<recv_proc_t> procs;
+    vector<int> procinds;
+    int npoints;                // total number of received points
+    
+    vector<int> index;          // gather index list
+  };
+  
+  // A send descriptor; describing what to send to other processors
+  struct send_comp_t {
+    // This structure does not exist for all components -- components
+    // which are not accessed are not described, making this a sparse
+    // data structure.  The field c contains the component number.
+    vector<fasterp_src_loc_t> locs;
+    int c;                      // source component
+  };
+  
+  struct send_rl_t {
+    vector<send_comp_t> comps;
+    vector<int> compinds;
+  };
+  
+  struct send_map_t {
+    vector<send_rl_t> rls;
+  };
+
+  struct send_proc_t {
+    // This structure does not exist for all processors -- processors
+    // with which there is no communication are not described, making
+    // this a sparse data structure.  The field p contains the
+    // processor number.
+    vector<send_map_t> maps;
+    int p;                      // receiving processor
+    int offset;
+    int npoints;                // total number of sent points
+  };
+  
+  struct send_descr_t {
+    vector<send_proc_t> procs;
+    // vector<int> procinds;
+    int npoints;                // total number of sent points
+  };
+  
+  
+  
+  class fasterp_setup_t {
+    recv_descr_t recv_descr;
+    send_descr_t send_descr;
+    int order;
+    
+  public:
+    fasterp_setup_t (cGH const * restrict cctkGH,
+                     fasterp_glocs_t const & locations,
+                     int order);
+    
+    ~ fasterp_setup_t ();
+    
+    void 
+    interpolate (cGH const * restrict cctkGH,
+                 vector<int> const & varinds,
+                 vector<CCTK_REAL *> & values)
+      const;
+  };
+  
+  
+  
+} // namespace CarpetInterp2
+
+#endif  // #define FASTERP_HH
diff --git a/Carpet/CarpetInterp2/src/make.code.defn b/Carpet/CarpetInterp2/src/make.code.defn
new file mode 100644
index 000000000..d95df47d6
--- /dev/null
+++ b/Carpet/CarpetInterp2/src/make.code.defn
@@ -0,0 +1,8 @@
+# Main make.code.defn file for thorn CarpetInterp2
+
+# Source files in this directory
+SRCS = fasterp.cc
+
+# Subdirectories containing source files
+SUBDIRS = 
+
diff --git a/Carpet/CarpetLib/interface.ccl b/Carpet/CarpetLib/interface.ccl
index 44b7729d5..6e7462678 100644
--- a/Carpet/CarpetLib/interface.ccl
+++ b/Carpet/CarpetLib/interface.ccl
@@ -4,6 +4,7 @@ IMPLEMENTS: CarpetLib
 
 includes header: defs.hh in defs.hh
 includes header: dist.hh in dist.hh
+includes header: typeprops.hh in typeprops.hh
 
 includes header: bbox.hh in bbox.hh
 includes header: bboxset.hh in bboxset.hh
diff --git a/Carpet/CarpetLib/param.ccl b/Carpet/CarpetLib/param.ccl
index c1d3754ec..45724f25d 100644
--- a/Carpet/CarpetLib/param.ccl
+++ b/Carpet/CarpetLib/param.ccl
@@ -85,6 +85,14 @@ STRING memstat_file "File name in which memstat output is collected (because std
 
 
 
+# Experimental recomposing parameters
+
+BOOLEAN combine_recompose "Recompose all grid functions of one refinement levels at once" STEERABLE=always
+{
+} "no"
+
+
+
 # Experimental communication parameters
 
 BOOLEAN interleave_communications "Try to interleave communications with each other; each processor begins to communicate with its 'right neighbour' in rank, instead of with the root processor" STEERABLE=always
diff --git a/Carpet/CarpetLib/src/commstate.cc b/Carpet/CarpetLib/src/commstate.cc
index b6ed4095a..7a00157c2 100644
--- a/Carpet/CarpetLib/src/commstate.cc
+++ b/Carpet/CarpetLib/src/commstate.cc
@@ -1,6 +1,7 @@
 #include <cassert>
 #include <cstdlib>
 #include <cstring>
+#include <iostream>
 
 #include "cctk.h"
 #include "cctk_Parameters.h"
@@ -115,7 +116,7 @@ void comm_state::step ()
           if (commstate_verbose) {
             CCTK_INFO ("Finished MPI_Irecv");
           }
-          timer.stop (0);
+          timer.stop (procbuf.recvbufsize * datatypesize);
           num_posted_recvs++;
         }
       }
diff --git a/Carpet/CarpetLib/src/commstate.hh b/Carpet/CarpetLib/src/commstate.hh
index 8cc8d40b4..c01f732da 100644
--- a/Carpet/CarpetLib/src/commstate.hh
+++ b/Carpet/CarpetLib/src/commstate.hh
@@ -1,6 +1,7 @@
 #ifndef COMMSTATE_HH
 #define COMMSTATE_HH
 
+#include <cstdlib>
 #include <queue>
 #include <vector>
 
diff --git a/Carpet/CarpetLib/src/defs.hh b/Carpet/CarpetLib/src/defs.hh
index 1152c154a..d1d8b73f0 100644
--- a/Carpet/CarpetLib/src/defs.hh
+++ b/Carpet/CarpetLib/src/defs.hh
@@ -62,24 +62,32 @@ template<typename T, int D> class bbox;
 template<typename T, int D> class bboxset;
 template<typename T, int D, typename P> class fulltree;
 
-struct pseudoregion_t;
-struct region_t;
-
-typedef vect<bool,dim>   bvect;
-typedef vect<int,dim>    ivect;
-typedef bbox<int,dim>    ibbox;
-typedef bboxset<int,dim> ibset;
-typedef fulltree<int,dim,pseudoregion_t> ipfulltree;
-
+typedef vect<bool,dim>      bvect;
+typedef vect<int,dim>       ivect;
+typedef vect<CCTK_INT,dim>  jvect;
+typedef vect<CCTK_REAL,dim> rvect;
+typedef bbox<int,dim>       ibbox;
+typedef bbox<CCTK_INT,dim>  jbbox;
+typedef bbox<CCTK_REAL,dim> rbbox;
+typedef bboxset<int,dim>    ibset;
+  
 // (Try to replace these by b2vect and i2vect)
 typedef vect<vect<bool,2>,dim> bbvect;
 typedef vect<vect<int,2>,dim>  iivect;
+typedef vect<vect<CCTK_INT,2>,dim> jjvect;
 
 typedef vect<vect<bool,dim>,2> b2vect;
 typedef vect<vect<int,dim>,2>  i2vect;
 
 
 
+struct pseudoregion_t;
+struct region_t;
+
+typedef fulltree<int,dim,pseudoregion_t> ipfulltree;
+
+
+
 // A general type
 enum centering { error_centered, vertex_centered, cell_centered };
 
diff --git a/Carpet/CarpetLib/src/dh.cc b/Carpet/CarpetLib/src/dh.cc
index fa990a2b0..a3d50d08a 100644
--- a/Carpet/CarpetLib/src/dh.cc
+++ b/Carpet/CarpetLib/src/dh.cc
@@ -71,7 +71,6 @@ inline
 int
 dh::this_proc (int const rl, int const c) const
 {
-  // return c % dist::size();
   return h.processor (rl, c);
 }
 
@@ -1006,6 +1005,8 @@ void
 dh::
 recompose (int const rl, bool const do_prolongate)
 {
+  DECLARE_CCTK_PARAMETERS;
+  
   assert (rl>=0 and rl<h.reflevels());
   
   static Timer timer ("dh::recompose");
@@ -1015,13 +1016,31 @@ recompose (int const rl, bool const do_prolongate)
     (*f)->recompose_crop ();
   }
   
-  for (list<ggf*>::iterator f=gfs.begin(); f!=gfs.end(); ++f) {
-    (*f)->recompose_allocate (rl);
+  if (combine_recompose) {
+    // Recompose all grid functions of this refinement levels at once.
+    // This may be faster, but requires more memory.
+    for (list<ggf*>::iterator f=gfs.begin(); f!=gfs.end(); ++f) {
+      (*f)->recompose_allocate (rl);
+    }
     for (comm_state state; not state.done(); state.step()) {
-      (*f)->recompose_fill (state, rl, do_prolongate);
+      for (list<ggf*>::iterator f=gfs.begin(); f!=gfs.end(); ++f) {
+        (*f)->recompose_fill (state, rl, do_prolongate);
+      }
     }
-    (*f)->recompose_free_old (rl);
-  } // for all grid functions of same vartype
+    for (list<ggf*>::iterator f=gfs.begin(); f!=gfs.end(); ++f) {
+      (*f)->recompose_free_old (rl);
+    }
+  } else {
+    // Recompose the grid functions sequentially.  This may be slower,
+    // but requires less memory.  This is the default.
+    for (list<ggf*>::iterator f=gfs.begin(); f!=gfs.end(); ++f) {
+      (*f)->recompose_allocate (rl);
+      for (comm_state state; not state.done(); state.step()) {
+        (*f)->recompose_fill (state, rl, do_prolongate);
+      }
+      (*f)->recompose_free_old (rl);
+    }
+  }
   
   timer.stop (0);
 }
diff --git a/Carpet/CarpetLib/src/dist.cc b/Carpet/CarpetLib/src/dist.cc
index 7ac6f73f6..c870990fb 100644
--- a/Carpet/CarpetLib/src/dist.cc
+++ b/Carpet/CarpetLib/src/dist.cc
@@ -53,6 +53,27 @@ namespace dist {
     MPI_Finalize ();
   }
   
+  
+  
+  // Create an MPI datatype from a C datatype description
+  void create_mpi_datatype (size_t const count,
+                            mpi_struct_descr_t const descr[],
+                            MPI_Datatype & newtype)
+  {
+    int blocklengths[count];
+    MPI_Aint displacements[count];
+    MPI_Datatype types[count];
+    for (size_t n=0; n<count; ++n) {
+      blocklengths [n] = descr[n].blocklength;
+      displacements[n] = descr[n].displacement;
+      types        [n] = descr[n].type;
+    }
+    MPI_Type_struct (count, blocklengths, displacements, types, &newtype);
+    MPI_Type_commit (&newtype);
+  }
+  
+  
+  
   void checkpoint (const char* file, int line) {
     DECLARE_CCTK_PARAMETERS;
     if (verbose) {
diff --git a/Carpet/CarpetLib/src/dist.hh b/Carpet/CarpetLib/src/dist.hh
index ae7953f99..cf4cbd70c 100644
--- a/Carpet/CarpetLib/src/dist.hh
+++ b/Carpet/CarpetLib/src/dist.hh
@@ -30,6 +30,19 @@ namespace dist {
   void pseudoinit (MPI_Comm const c);
   void finalize ();
   
+  // Create MPI datatypes from C structures
+  struct mpi_struct_descr_t {
+    int          blocklength;
+    MPI_Aint     displacement;
+    MPI_Datatype type;
+  };
+  
+  void create_mpi_datatype (size_t const count,
+                            mpi_struct_descr_t const descr[],
+                            MPI_Datatype & newtype);
+  
+  
+  
   // Debugging output
 #define CHECKPOINT dist::checkpoint(__FILE__, __LINE__)
   void checkpoint (const char* file, int line);
diff --git a/Carpet/CarpetLib/src/gf.hh b/Carpet/CarpetLib/src/gf.hh
index 0ca125631..d5feb0a63 100644
--- a/Carpet/CarpetLib/src/gf.hh
+++ b/Carpet/CarpetLib/src/gf.hh
@@ -50,12 +50,14 @@ protected:
   
   virtual gdata* typed_data (int tl, int rl, int c, int ml)
   {
+    data<T>* const vl =
+      this->vectorleader
+      ? (data<T>*)(*this->vectorleader)(tl,rl,c,ml)
+      : NULL;
     return new data<T>(this->varindex,
                        h.refcent, this->transport_operator,
                        this->vectorlength, this->vectorindex,
-                       this->vectorleader
-                       ? (data<T>*)(*this->vectorleader)(tl,rl,c,ml)
-                       : NULL);
+                       vl);
   }
   
   
diff --git a/Carpet/CarpetLib/src/gh.cc b/Carpet/CarpetLib/src/gh.cc
index 9b4a5f443..9a04af1df 100644
--- a/Carpet/CarpetLib/src/gh.cc
+++ b/Carpet/CarpetLib/src/gh.cc
@@ -272,6 +272,106 @@ local_components (int const rl)
 
 
 
+// Find the refinement level and component to which a grid point
+// belongs.  This uses a tree search over the superregions in the grid
+// struction, which should scale reasonably (O(n log n)) better with
+// the number of componets components.
+void
+gh::
+locate_position (rvect const & rpos,
+                 int const ml,
+                 int const minrl, int const maxrl,
+                 int & rl, int & c, ivect & aligned_ipos) const
+{
+  assert (ml>=0 and ml<mglevels());
+  assert (minrl>=0 and minrl<=maxrl and maxrl<=reflevels());
+  
+  // Try finer levels first
+  for (rl = maxrl-1; rl >= minrl; --rl) {
+    
+    // Align (round) the position to the nearest existing grid point
+    // on this refinement level
+    ivect const str = baseextent(ml,rl).stride();
+    aligned_ipos = ivect(floor(rpos / rvect(str) + rvect(0.5))) * str;
+    
+    gh::cregs const & regs = superregions.AT(rl);
+    
+    // Search all superregions linearly.  Each superregion corresponds
+    // to a "refined region", and the number of superregions is thus
+    // presumably independent of the number of processors.
+    for (size_t r = 0; r < regs.size(); ++r) {
+      region_t const & reg = regs.AT(r);
+      if (reg.extent.contains(aligned_ipos)) {
+        // We found the superregion to which this grid point belongs
+        
+        // Search the superregion hierarchically
+        pseudoregion_t const * const preg =
+          reg.processors->search(aligned_ipos);
+        assert (preg);
+        
+        // We now know the refinement level, component, and index to
+        // which this grid point belongs
+        c = preg->component;
+        return;
+      }
+    }
+  } // for rl
+  
+  // The point does not belong to any component on any refinement
+  // level
+  rl = -1;
+  c = -1;
+}
+
+void
+gh::
+locate_position (ivect const & ipos,
+                 int const ml,
+                 int const minrl, int const maxrl,
+                 int & rl, int & c, ivect & aligned_ipos) const
+{
+  assert (ml>=0 and ml<mglevels());
+  assert (minrl>=0 and minrl<=maxrl and maxrl<=reflevels());
+  
+  // Try finer levels first
+  for (rl = maxrl-1; rl >= minrl; --rl) {
+    
+    // Align (round) the position to the nearest existing grid point
+    // on this refinement level
+    ivect const str = baseextent(ml, rl).stride();
+    aligned_ipos = ivect(floor(rvect(ipos) / rvect(str) + rvect(0.5))) * str;
+    
+    gh::cregs const & regs = superregions.AT(rl);
+    
+    // Search all superregions linearly.  Each superregion corresponds
+    // to a "refined region", and the number of superregions is thus
+    // presumably independent of the number of processors.
+    for (size_t r = 0; r < regs.size(); ++r) {
+      region_t const & reg = regs.AT(r);
+      if (reg.extent.contains(aligned_ipos)) {
+        // We found the superregion to which this grid point belongs
+        
+        // Search the superregion hierarchically
+        pseudoregion_t const * const preg =
+          reg.processors->search(aligned_ipos);
+        assert (preg);
+        
+        // We now know the refinement level, component, and index to
+        // which this grid point belongs
+        c = preg->component;
+        return;
+      }
+    }
+  } // for rl
+  
+  // The point does not belong to any component on any refinement
+  // level
+  rl = -1;
+  c = -1;
+}
+
+
+
 // Time hierarchy management
 
 void
diff --git a/Carpet/CarpetLib/src/gh.hh b/Carpet/CarpetLib/src/gh.hh
index ffac38804..b80d71ca3 100644
--- a/Carpet/CarpetLib/src/gh.hh
+++ b/Carpet/CarpetLib/src/gh.hh
@@ -128,6 +128,16 @@ public:
   
   int local_components (const int rl) const;
   
+  void locate_position (rvect const & rpos,
+                        int const ml,
+                        int const minrl, int const maxrl,
+                        int & rl, int & c, ivect & aligned_ipos) const;
+  
+  void locate_position (ivect const & ipos,
+                        int const ml,
+                        int const minrl, int const maxrl,
+                        int & rl, int & c, ivect & aligned_ipos) const;
+  
   // Time hierarchy management
   void add (th * t);
   void remove (th * t);
diff --git a/Carpet/CarpetLib/src/prolongate_3d_o11_rf2.cc b/Carpet/CarpetLib/src/prolongate_3d_o11_rf2.cc
index 020158d4b..d731d524d 100644
--- a/Carpet/CarpetLib/src/prolongate_3d_o11_rf2.cc
+++ b/Carpet/CarpetLib/src/prolongate_3d_o11_rf2.cc
@@ -35,20 +35,19 @@ namespace CarpetLib {
   RT
   coeff (int const i)
   {
-    RT const one = 1;
     static const RT coeffs[ncoeffs] = {
-           63/one*524288,
-      -   819/one*524288,
-         5005/one*524288,
-      - 19305/one*524288,
-        27027/one*262144,
-      - 63063/one*262144,
-       189189/one*262144,
-       135135/one*262144,
-      - 45045/one*524288,
-         9009/one*524288,
-      -  1287/one*524288,
-           91/one*524288
+           63/RT(524288.0),
+      -   819/RT(524288.0),
+         5005/RT(524288.0),
+      - 19305/RT(524288.0),
+        27027/RT(262144.0),
+      - 63063/RT(262144.0),
+       189189/RT(262144.0),
+       135135/RT(262144.0),
+      - 45045/RT(524288.0),
+         9009/RT(524288.0),
+      -  1287/RT(524288.0),
+           91/RT(524288.0)
     };
     return coeffs[i];
   }
@@ -74,7 +73,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp0 (p + i*d1);
+      res += coeff<RT>(i) * interp0<T> (p + i*d1);
     }
     return res;
   }
@@ -90,7 +89,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp1 (p + i*d2, d1);
+      res += coeff<RT>(i) * interp1<T> (p + i*d2, d1);
     }
     return res;
   }
@@ -107,7 +106,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp2 (p + i*d3, d1, d2);
+      res += coeff<RT>(i) * interp2<T> (p + i*d3, d1, d2);
     }
     return res;
   }
@@ -245,7 +244,7 @@ namespace CarpetLib {
     
     // kernel
    l8000:
-    dst[DSTIND3(id,jd,kd)] = interp0 (& src[SRCIND3(is,js,ks)]);
+    dst[DSTIND3(id,jd,kd)] = interp0<T> (& src[SRCIND3(is,js,ks)]);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8001;
@@ -253,7 +252,7 @@ namespace CarpetLib {
     
     // kernel
    l8001:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is-3,js,ks)], srcdi);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is-3,js,ks)], srcdi);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -277,7 +276,7 @@ namespace CarpetLib {
     
     // kernel
    l8010:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js-3,ks)], srcdj);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js-3,ks)], srcdj);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8011;
@@ -286,7 +285,7 @@ namespace CarpetLib {
     // kernel
    l8011:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -326,7 +325,7 @@ namespace CarpetLib {
     
     // kernel
    l8100:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js,ks-3)], srcdk);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js,ks-3)], srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8101;
@@ -335,7 +334,7 @@ namespace CarpetLib {
     // kernel
    l8101:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -360,7 +359,7 @@ namespace CarpetLib {
     // kernel
    l8110:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
+      interp2<T> (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8111;
@@ -370,7 +369,7 @@ namespace CarpetLib {
    l8111:
     {
       dst[DSTIND3(id,jd,kd)] =
-        interp3 (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
+        interp3<T> (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
     }
     i = i+1;
     id = id+1;
diff --git a/Carpet/CarpetLib/src/prolongate_3d_o7_rf2.cc b/Carpet/CarpetLib/src/prolongate_3d_o7_rf2.cc
index fcf4d710f..a7341139f 100644
--- a/Carpet/CarpetLib/src/prolongate_3d_o7_rf2.cc
+++ b/Carpet/CarpetLib/src/prolongate_3d_o7_rf2.cc
@@ -35,16 +35,15 @@ namespace CarpetLib {
   RT
   coeff (int const i)
   {
-    RT const one = 1;
     static const RT coeffs[ncoeffs] = {
-      -   5*one/2048,
-         49*one/2048,
-      - 245*one/2048,
-       1225*one/2048,
-       1225*one/2048,
-      - 245*one/2048,
-         49*one/2048,
-      -   5*one/2048
+      -   5/RT(2048.0),
+         49/RT(2048.0),
+      - 245/RT(2048.0),
+       1225/RT(2048.0),
+       1225/RT(2048.0),
+      - 245/RT(2048.0),
+         49/RT(2048.0),
+      -   5/RT(2048.0)
     };
     return coeffs[i];
   }
@@ -70,7 +69,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp0 (p + i*d1);
+      res += coeff<RT>(i) * interp0<T> (p + i*d1);
     }
     return res;
   }
@@ -86,7 +85,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp1 (p + i*d2, d1);
+      res += coeff<RT>(i) * interp1<T> (p + i*d2, d1);
     }
     return res;
   }
@@ -103,7 +102,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp2 (p + i*d3, d1, d2);
+      res += coeff<RT>(i) * interp2<T> (p + i*d3, d1, d2);
     }
     return res;
   }
@@ -241,7 +240,7 @@ namespace CarpetLib {
     
     // kernel
    l8000:
-    dst[DSTIND3(id,jd,kd)] = interp0 (& src[SRCIND3(is,js,ks)]);
+    dst[DSTIND3(id,jd,kd)] = interp0<T> (& src[SRCIND3(is,js,ks)]);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8001;
@@ -249,7 +248,7 @@ namespace CarpetLib {
     
     // kernel
    l8001:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is-3,js,ks)], srcdi);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is-3,js,ks)], srcdi);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -273,7 +272,7 @@ namespace CarpetLib {
     
     // kernel
    l8010:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js-3,ks)], srcdj);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js-3,ks)], srcdj);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8011;
@@ -282,7 +281,7 @@ namespace CarpetLib {
     // kernel
    l8011:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -322,7 +321,7 @@ namespace CarpetLib {
     
     // kernel
    l8100:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js,ks-3)], srcdk);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js,ks-3)], srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8101;
@@ -331,7 +330,7 @@ namespace CarpetLib {
     // kernel
    l8101:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -356,7 +355,7 @@ namespace CarpetLib {
     // kernel
    l8110:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
+      interp2<T> (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8111;
@@ -366,7 +365,7 @@ namespace CarpetLib {
    l8111:
     {
       dst[DSTIND3(id,jd,kd)] =
-        interp3 (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
+        interp3<T> (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
     }
     i = i+1;
     id = id+1;
diff --git a/Carpet/CarpetLib/src/prolongate_3d_o9_rf2.cc b/Carpet/CarpetLib/src/prolongate_3d_o9_rf2.cc
index 8e2d6fc18..cd0d6038b 100644
--- a/Carpet/CarpetLib/src/prolongate_3d_o9_rf2.cc
+++ b/Carpet/CarpetLib/src/prolongate_3d_o9_rf2.cc
@@ -35,18 +35,17 @@ namespace CarpetLib {
   RT
   coeff (int const i)
   {
-    RT const one = 1;
     static const RT coeffs[ncoeffs] = {
-      -   35*one/65536,
-         385*one/65536,
-      -  495*one/16384,
-        1617*one/16384,
-      - 8085*one/32768,
-       24255*one/32768,
-        8085*one/16384,
-      - 1155*one/16384,
-         693*one/65536,
-      -   55*one/65536
+      -   35/RT(65536.0),
+         385/RT(65536.0),
+      -  495/RT(16384.0),
+        1617/RT(16384.0),
+      - 8085/RT(32768.0),
+       24255/RT(32768.0),
+        8085/RT(16384.0),
+      - 1155/RT(16384.0),
+         693/RT(65536.0),
+      -   55/RT(65536.0)
     };
     return coeffs[i];
   }
@@ -72,7 +71,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp0 (p + i*d1);
+      res += coeff<RT>(i) * interp0<T> (p + i*d1);
     }
     return res;
   }
@@ -88,7 +87,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp1 (p + i*d2, d1);
+      res += coeff<RT>(i) * interp1<T> (p + i*d2, d1);
     }
     return res;
   }
@@ -105,7 +104,7 @@ namespace CarpetLib {
     typedef typename typeprops<T>::real RT;
     T res = typeprops<T>::fromreal (0);
     for (int i=0; i<ncoeffs; ++i) {
-      res += coeff<RT>(i) * interp2 (p + i*d3, d1, d2);
+      res += coeff<RT>(i) * interp2<T> (p + i*d3, d1, d2);
     }
     return res;
   }
@@ -243,7 +242,7 @@ namespace CarpetLib {
     
     // kernel
    l8000:
-    dst[DSTIND3(id,jd,kd)] = interp0 (& src[SRCIND3(is,js,ks)]);
+    dst[DSTIND3(id,jd,kd)] = interp0<T> (& src[SRCIND3(is,js,ks)]);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8001;
@@ -251,7 +250,7 @@ namespace CarpetLib {
     
     // kernel
    l8001:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is-3,js,ks)], srcdi);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is-3,js,ks)], srcdi);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -275,7 +274,7 @@ namespace CarpetLib {
     
     // kernel
    l8010:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js-3,ks)], srcdj);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js-3,ks)], srcdj);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8011;
@@ -284,7 +283,7 @@ namespace CarpetLib {
     // kernel
    l8011:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js-3,ks)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -324,7 +323,7 @@ namespace CarpetLib {
     
     // kernel
    l8100:
-    dst[DSTIND3(id,jd,kd)] = interp1 (& src[SRCIND3(is,js,ks-3)], srcdk);
+    dst[DSTIND3(id,jd,kd)] = interp1<T> (& src[SRCIND3(is,js,ks-3)], srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8101;
@@ -333,7 +332,7 @@ namespace CarpetLib {
     // kernel
    l8101:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
+      interp2<T> (& src[SRCIND3(is-3,js,ks-3)], srcdi, srcdj);
     i = i+1;
     id = id+1;
     is = is+1;
@@ -358,7 +357,7 @@ namespace CarpetLib {
     // kernel
    l8110:
     dst[DSTIND3(id,jd,kd)] =
-      interp2 (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
+      interp2<T> (& src[SRCIND3(is,js-3,ks-3)], srcdj, srcdk);
     i = i+1;
     id = id+1;
     if (i < regiext) goto l8111;
@@ -368,7 +367,7 @@ namespace CarpetLib {
    l8111:
     {
       dst[DSTIND3(id,jd,kd)] =
-        interp3 (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
+        interp3<T> (& src[SRCIND3(is-3,js-3,ks-3)], srcdi, srcdj, srcdk);
     }
     i = i+1;
     id = id+1;
diff --git a/Carpet/CarpetReduce/interface.ccl b/Carpet/CarpetReduce/interface.ccl
index 71b96c3a6..e19087aa9 100644
--- a/Carpet/CarpetReduce/interface.ccl
+++ b/Carpet/CarpetReduce/interface.ccl
@@ -14,12 +14,28 @@ CCTK_INT FUNCTION \
     SymmetryTableHandleForGrid (CCTK_POINTER_TO_CONST IN cctkGH)
 REQUIRES FUNCTION SymmetryTableHandleForGrid
 
-CCTK_INT FUNCTION GetBoundarySpecification \
-  (CCTK_INT IN size, \
-   CCTK_INT OUT ARRAY nboundaryzones, \
-   CCTK_INT OUT ARRAY is_internal, \
-   CCTK_INT OUT ARRAY is_staggered, \
-   CCTK_INT OUT ARRAY shiftout)
+CCTK_INT FUNCTION     \
+    MultiPatch_GetMap \
+        (CCTK_POINTER_TO_CONST IN cctkGH)
+USES FUNCTION MultiPatch_GetMap
+
+CCTK_INT FUNCTION                           \
+    MultiPatch_GetBoundarySpecification     \
+        (CCTK_INT IN map,                   \
+         CCTK_INT IN size,                  \
+         CCTK_INT OUT ARRAY nboundaryzones, \
+         CCTK_INT OUT ARRAY is_internal,    \
+         CCTK_INT OUT ARRAY is_staggered,   \
+         CCTK_INT OUT ARRAY shiftout)
+USES FUNCTION MultiPatch_GetBoundarySpecification
+
+CCTK_INT FUNCTION                           \
+    GetBoundarySpecification                \
+        (CCTK_INT IN size,                  \
+         CCTK_INT OUT ARRAY nboundaryzones, \
+         CCTK_INT OUT ARRAY is_internal,    \
+         CCTK_INT OUT ARRAY is_staggered,   \
+         CCTK_INT OUT ARRAY shiftout)
 REQUIRES FUNCTION GetBoundarySpecification
 
 
diff --git a/Carpet/CarpetReduce/src/mask_coords.c b/Carpet/CarpetReduce/src/mask_coords.c
index 2b7d706bd..6ea6d52ea 100644
--- a/Carpet/CarpetReduce/src/mask_coords.c
+++ b/Carpet/CarpetReduce/src/mask_coords.c
@@ -24,8 +24,15 @@ CoordBase_SetupMask (CCTK_ARGUMENTS)
   
   
   
-  ierr = GetBoundarySpecification
-    (6, nboundaryzones, is_internal, is_staggered, shiftout);
+  if (CCTK_IsFunctionAliased ("MultiPatch_GetBoundarySpecification")) {
+    int const m = MultiPatch_GetMap (cctkGH);
+    assert (m >= 0);
+    ierr = MultiPatch_GetBoundarySpecification
+      (m, 6, nboundaryzones, is_internal, is_staggered, shiftout);
+  } else {
+    ierr = GetBoundarySpecification
+      (6, nboundaryzones, is_internal, is_staggered, shiftout);
+  }
   if (ierr != 0) {
     CCTK_WARN (0, "Could not get boundary specification");
   }
diff --git a/Carpet/CarpetReduce/src/reduce.cc b/Carpet/CarpetReduce/src/reduce.cc
index c7b584b6f..3034d72ef 100644
--- a/Carpet/CarpetReduce/src/reduce.cc
+++ b/Carpet/CarpetReduce/src/reduce.cc
@@ -776,22 +776,24 @@ namespace CarpetReduce {
     const MPI_Datatype mpitype = CarpetSimpleMPIDatatype(outtype);
     const int mpilength = CarpetSimpleMPIDatatypeLength(outtype);
     if (proc == -1) {
-      MPI_Allreduce ((void*)myoutvals, outvals, mpilength*num_outvals,
+      MPI_Allreduce (const_cast<void*>(myoutvals), outvals,
+                     mpilength*num_outvals,
 		     mpitype, red->mpi_op(),
 		     CarpetMPIComm());
       if (red->uses_cnt()) {
-	MPI_Allreduce ((void*)mycounts, &counts[0], num_outvals*mpilength,
+	MPI_Allreduce (const_cast<void*>(mycounts), &counts[0],
+                       num_outvals*mpilength,
 		       mpitype, MPI_SUM,
 		       CarpetMPIComm());
       }
     } else {
-      MPI_Reduce ((void*)myoutvals, outvals, num_outvals*mpilength,
-		  mpitype, red->mpi_op(),
-		  proc, CarpetMPIComm());
+      MPI_Reduce (const_cast<void*>(myoutvals), outvals,
+                  num_outvals*mpilength,
+		  mpitype, red->mpi_op(), proc, CarpetMPIComm());
       if (red->uses_cnt()) {
-	MPI_Reduce ((void*)mycounts, &counts[0], num_outvals*mpilength,
-		    mpitype, MPI_SUM,
-		    proc, CarpetMPIComm());
+	MPI_Reduce (const_cast<void*>(mycounts), &counts[0],
+                    num_outvals*mpilength,
+		    mpitype, MPI_SUM, proc, CarpetMPIComm());
       }
     }
     
diff --git a/Carpet/CarpetRegrid/src/automatic.cc b/Carpet/CarpetRegrid/src/automatic.cc
index 442224f2c..7248b732a 100644
--- a/Carpet/CarpetRegrid/src/automatic.cc
+++ b/Carpet/CarpetRegrid/src/automatic.cc
@@ -50,7 +50,7 @@ namespace CarpetRegrid {
       = (*dynamic_cast<const gf<CCTK_REAL>*>
          (arrdata.at(gi).at(Carpet::map).data.at(vi-v1)));
     
-    assert (! smart_outer_boundaries);
+    assert (not smart_outer_boundaries);
     
     vector<region_t> regs;
     Automatic_OneLevel
diff --git a/Carpet/CarpetSlab/src/Get.cc b/Carpet/CarpetSlab/src/Get.cc
index 09f36a7ab..f0c94821d 100644
--- a/Carpet/CarpetSlab/src/Get.cc
+++ b/Carpet/CarpetSlab/src/Get.cc
@@ -30,7 +30,7 @@ namespace CarpetSlab {
     // Check arguments
     assert (cctkGH);
     assert (mapping_handle>=0);
-    assert (proc==-1 || proc>=0 && proc<CCTK_nProcs(cctkGH));
+    assert (proc==-1 || (proc>=0 && proc<CCTK_nProcs(cctkGH)));
     assert (vindex>=0 && vindex<CCTK_NumVars());
     assert (timelevel>=0);
     assert (hdatatype>=0);
diff --git a/Carpet/CarpetWeb/publications.html b/Carpet/CarpetWeb/publications.html
index c67ec709d..2278c90c9 100644
--- a/Carpet/CarpetWeb/publications.html
+++ b/Carpet/CarpetWeb/publications.html
@@ -300,6 +300,16 @@ Palenzuela, Erik Schnetter, Manuel Tiglio,<br />
 </li>
 
 <li>
+  <!-- received 2006-12-26 -->
+  <p>Comparisons of binary black hole merger waveforms,<br />
+    <i>John G. Baker, Manuela Campanelli, Frans Pretorius, Yosef
+    Zlochower,</i><br />
+    <a href="http://dx.doi.org/10.1088/0264-9381/24/12/S03">Class. Quantum
+      Grav. <b>24</b>, S25-S31 (2007)</a>,<br />
+    <a href="http://arxiv.org/abs/gr-qc/0701016">arXiv:gr-qc/0701016</a>.</p>
+</li>
+
+<li>
 <!-- Herrmann:2006ks -->
 <!-- received 2007-01-04 -->
 <p>Frank Herrmann, Ian Hinder, Deirdre M. Shoemaker, Pablo Laguna,<br />
author	Erik Schnetter <schnetter@cct.lsu.edu>	2008-07-22 13:47:09 -0500
committer	Erik Schnetter <schnetter@cct.lsu.edu>	2008-07-22 13:47:09 -0500
commit	b4da2bc7694fff331465ce0185daf70b126a0793 (patch)
tree	5abefedf02bcd4842fe424b6e3809a6a896a5382
parent	679c409c327078bb41481fba8757063e29cf5525 (diff)
parent	5c20bc1bd05c8d870508d887de4fbe9a04a61e39 (diff)